annotate src/de/mpiwg/dwinter/duomo/lexdump/LexOWLTransformer.java @ 5:923e73fa07f1

Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
author dwinter
date Mon, 07 Feb 2011 16:51:38 +0100
parents 72004a788198
children 30fc93374f10
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
fb3f3df002df first release
dwinter
parents:
diff changeset
1 package de.mpiwg.dwinter.duomo.lexdump;
fb3f3df002df first release
dwinter
parents:
diff changeset
2
1
dwinter
parents: 0
diff changeset
3 import java.io.File;
dwinter
parents: 0
diff changeset
4 import java.io.FileWriter;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
5 import java.io.IOException;
fb3f3df002df first release
dwinter
parents:
diff changeset
6 import java.net.URI;
fb3f3df002df first release
dwinter
parents:
diff changeset
7 import java.net.URISyntaxException;
fb3f3df002df first release
dwinter
parents:
diff changeset
8 import java.net.URLEncoder;
fb3f3df002df first release
dwinter
parents:
diff changeset
9 import java.util.Collection;
fb3f3df002df first release
dwinter
parents:
diff changeset
10 import java.util.HashMap;
fb3f3df002df first release
dwinter
parents:
diff changeset
11 import java.util.HashSet;
fb3f3df002df first release
dwinter
parents:
diff changeset
12 import java.util.Iterator;
fb3f3df002df first release
dwinter
parents:
diff changeset
13 import java.util.List;
fb3f3df002df first release
dwinter
parents:
diff changeset
14 import java.util.Map;
fb3f3df002df first release
dwinter
parents:
diff changeset
15 import java.util.Set;
fb3f3df002df first release
dwinter
parents:
diff changeset
16
fb3f3df002df first release
dwinter
parents:
diff changeset
17 import javax.print.URIException;
fb3f3df002df first release
dwinter
parents:
diff changeset
18
fb3f3df002df first release
dwinter
parents:
diff changeset
19 import org.apache.log4j.Level;
fb3f3df002df first release
dwinter
parents:
diff changeset
20 import org.apache.log4j.Logger;
fb3f3df002df first release
dwinter
parents:
diff changeset
21 import org.jdom.Attribute;
fb3f3df002df first release
dwinter
parents:
diff changeset
22 import org.jdom.Element;
fb3f3df002df first release
dwinter
parents:
diff changeset
23 import org.jdom.JDOMException;
fb3f3df002df first release
dwinter
parents:
diff changeset
24 import org.jdom.xpath.XPath;
fb3f3df002df first release
dwinter
parents:
diff changeset
25
fb3f3df002df first release
dwinter
parents:
diff changeset
26 import com.sun.xml.internal.ws.developer.MemberSubmissionEndpointReference.Elements;
fb3f3df002df first release
dwinter
parents:
diff changeset
27
fb3f3df002df first release
dwinter
parents:
diff changeset
28 import edu.stanford.smi.protege.exception.OntologyLoadException;
fb3f3df002df first release
dwinter
parents:
diff changeset
29 import edu.stanford.smi.protege.model.Instance;
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
30 import edu.stanford.smi.protegex.owl.jena.JenaOWLModel;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
31 import edu.stanford.smi.protegex.owl.model.OWLAllValuesFrom;
fb3f3df002df first release
dwinter
parents:
diff changeset
32 import edu.stanford.smi.protegex.owl.model.OWLClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
33 import edu.stanford.smi.protegex.owl.model.OWLDataRange;
fb3f3df002df first release
dwinter
parents:
diff changeset
34 import edu.stanford.smi.protegex.owl.model.OWLIndividual;
fb3f3df002df first release
dwinter
parents:
diff changeset
35 import edu.stanford.smi.protegex.owl.model.OWLNamedClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
36 import edu.stanford.smi.protegex.owl.model.OWLProperty;
fb3f3df002df first release
dwinter
parents:
diff changeset
37 import edu.stanford.smi.protegex.owl.model.OWLUnionClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
38 import edu.stanford.smi.protegex.owl.model.RDFList;
fb3f3df002df first release
dwinter
parents:
diff changeset
39 import edu.stanford.smi.protegex.owl.model.RDFProperty;
fb3f3df002df first release
dwinter
parents:
diff changeset
40 import edu.stanford.smi.protegex.owl.model.RDFResource;
fb3f3df002df first release
dwinter
parents:
diff changeset
41 import edu.stanford.smi.protegex.owl.model.impl.AbstractOWLQuantifierRestriction;
fb3f3df002df first release
dwinter
parents:
diff changeset
42 import edu.stanford.smi.protegex.owl.model.impl.DefaultOWLUnionClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
43
fb3f3df002df first release
dwinter
parents:
diff changeset
44 public class LexOWLTransformer {
fb3f3df002df first release
dwinter
parents:
diff changeset
45 private Logger logger = Logger.getRootLogger();
1
dwinter
parents: 0
diff changeset
46 private FileWriter missing;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
47 private OWLImporter owlDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
48 private LexDumpImporter lexDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
49 private Map<String, OWLIndividual> individualIds = new HashMap<String, OWLIndividual>(); // speichere
fb3f3df002df first release
dwinter
parents:
diff changeset
50 // ids
fb3f3df002df first release
dwinter
parents:
diff changeset
51 // fuer
fb3f3df002df first release
dwinter
parents:
diff changeset
52 // weitere
fb3f3df002df first release
dwinter
parents:
diff changeset
53 // Verwendung
fb3f3df002df first release
dwinter
parents:
diff changeset
54
1
dwinter
parents: 0
diff changeset
55 public LexOWLTransformer(OWLImporter owlDoc, LexDumpImporter lexDoc) throws IOException {
0
fb3f3df002df first release
dwinter
parents:
diff changeset
56 this.owlDoc = owlDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
57 this.lexDoc = lexDoc;
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
58 missing = new FileWriter(new File("/tmp/missing.out"));
0
fb3f3df002df first release
dwinter
parents:
diff changeset
59 }
fb3f3df002df first release
dwinter
parents:
diff changeset
60
fb3f3df002df first release
dwinter
parents:
diff changeset
61 /**
fb3f3df002df first release
dwinter
parents:
diff changeset
62 * @param args
fb3f3df002df first release
dwinter
parents:
diff changeset
63 * @throws Exception
fb3f3df002df first release
dwinter
parents:
diff changeset
64 */
fb3f3df002df first release
dwinter
parents:
diff changeset
65 public static void main(String[] args) throws Exception {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
66 System.out.println("Stack size has to be large, use at lease -Xss=2024k!");
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
67 if (args.length<2){
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
68 System.out.println("Usage: \"/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput\""+
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
69 "\"/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/duomoData/LEXXDUMP.xml\"");
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
70 System.exit(-1);
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
71 }
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
72
0
fb3f3df002df first release
dwinter
parents:
diff changeset
73 Logger.getRootLogger().setLevel(Level.DEBUG);
fb3f3df002df first release
dwinter
parents:
diff changeset
74 // Import OWL
fb3f3df002df first release
dwinter
parents:
diff changeset
75 //String base = "/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput";
fb3f3df002df first release
dwinter
parents:
diff changeset
76 String base=args[0];
fb3f3df002df first release
dwinter
parents:
diff changeset
77 String baseUri= base.replace(" ", "%20");
fb3f3df002df first release
dwinter
parents:
diff changeset
78 URI ontologieUri = new URI("file://"+baseUri+"/duomoAnalysis.owl");
fb3f3df002df first release
dwinter
parents:
diff changeset
79 //URI ontologieUri = new URI(
fb3f3df002df first release
dwinter
parents:
diff changeset
80 // "file:///Users/dwinter/Documents/Projekte/Diss%20-%20data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput/duomoAnalysis.owl");
fb3f3df002df first release
dwinter
parents:
diff changeset
81 OWLImporter owlDoc = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
82 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
83
fb3f3df002df first release
dwinter
parents:
diff changeset
84 owlDoc = new OWLImporter(base, ontologieUri);
fb3f3df002df first release
dwinter
parents:
diff changeset
85 // owlDoc.printModel();
fb3f3df002df first release
dwinter
parents:
diff changeset
86 } catch (OntologyLoadException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
87 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
88 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
89 }
fb3f3df002df first release
dwinter
parents:
diff changeset
90 // read and parse lexfile
fb3f3df002df first release
dwinter
parents:
diff changeset
91 //String lexFile = "/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/duomoData/LEXXDUMP.xml";
fb3f3df002df first release
dwinter
parents:
diff changeset
92 String lexFile=args[1];
fb3f3df002df first release
dwinter
parents:
diff changeset
93 LexDumpImporter lexDoc = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
94 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
95 lexDoc = new LexDumpImporter(lexFile);
fb3f3df002df first release
dwinter
parents:
diff changeset
96 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
97 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
98 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
99 } catch (IOException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
100 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
101 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
102 }
fb3f3df002df first release
dwinter
parents:
diff changeset
103
fb3f3df002df first release
dwinter
parents:
diff changeset
104 // List<Element> cartas = lexDoc.getCartas();
fb3f3df002df first release
dwinter
parents:
diff changeset
105 // System.out.println(cartas.size());
fb3f3df002df first release
dwinter
parents:
diff changeset
106
fb3f3df002df first release
dwinter
parents:
diff changeset
107 LexOWLTransformer tf = new LexOWLTransformer(owlDoc, lexDoc);
fb3f3df002df first release
dwinter
parents:
diff changeset
108 tf.transform();
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
109 owlDoc.save("file:///tmp/out.owl");
0
fb3f3df002df first release
dwinter
parents:
diff changeset
110 }
fb3f3df002df first release
dwinter
parents:
diff changeset
111
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
112 private void transform() throws URISyntaxException, Exception {
0
fb3f3df002df first release
dwinter
parents:
diff changeset
113 List<Element> signatures = lexDoc.getSignatures();
fb3f3df002df first release
dwinter
parents:
diff changeset
114
fb3f3df002df first release
dwinter
parents:
diff changeset
115 // Element signature = signatures.get(0);
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
116 int signatureCount = 0;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
117 int maxsign = signatures.size();
fb3f3df002df first release
dwinter
parents:
diff changeset
118 for (Element signature : signatures) {
fb3f3df002df first release
dwinter
parents:
diff changeset
119 logger.debug(String.format("Signature: %s (%s)", signatureCount,
fb3f3df002df first release
dwinter
parents:
diff changeset
120 maxsign));
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
121
72004a788198 save single file
dwinter
parents: 3
diff changeset
122 signatureCount++;
72004a788198 save single file
dwinter
parents: 3
diff changeset
123 //if (signatureCount<5 || signatureCount>10)
72004a788198 save single file
dwinter
parents: 3
diff changeset
124 // continue;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
125 OWLIndividual signatureInd = createSignature(signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
126
fb3f3df002df first release
dwinter
parents:
diff changeset
127 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
128 List<Element> cards = XPath.selectNodes(signature, ".//carta");
fb3f3df002df first release
dwinter
parents:
diff changeset
129 int cardsCount = 1;
fb3f3df002df first release
dwinter
parents:
diff changeset
130 int maxcards = cards.size();
fb3f3df002df first release
dwinter
parents:
diff changeset
131
fb3f3df002df first release
dwinter
parents:
diff changeset
132 // Element card=cards.get(0);
fb3f3df002df first release
dwinter
parents:
diff changeset
133 for (Element card : cards) {
fb3f3df002df first release
dwinter
parents:
diff changeset
134 logger.debug(String.format("Cards: %s (%s)", cardsCount++,
fb3f3df002df first release
dwinter
parents:
diff changeset
135 maxcards));
fb3f3df002df first release
dwinter
parents:
diff changeset
136 logger.debug(String.format("Signature: %s (%s)",
fb3f3df002df first release
dwinter
parents:
diff changeset
137 signatureCount, maxsign));
fb3f3df002df first release
dwinter
parents:
diff changeset
138 OWLIndividual cardInd = createCard(card, signatureInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
139
fb3f3df002df first release
dwinter
parents:
diff changeset
140 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
141 List<Element> records = XPath.selectNodes(card, ".//record");
fb3f3df002df first release
dwinter
parents:
diff changeset
142 for (Element record : records) {
fb3f3df002df first release
dwinter
parents:
diff changeset
143 // Element record = records.get(0);
fb3f3df002df first release
dwinter
parents:
diff changeset
144 OWLIndividual recordInd = createRecord(record, cardInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
145 OWLIndividual recordEvent = createEvent(record, recordInd); // Event
fb3f3df002df first release
dwinter
parents:
diff changeset
146 // und
fb3f3df002df first release
dwinter
parents:
diff changeset
147 // Records
fb3f3df002df first release
dwinter
parents:
diff changeset
148 // sind
fb3f3df002df first release
dwinter
parents:
diff changeset
149 // im
fb3f3df002df first release
dwinter
parents:
diff changeset
150 // Original
fb3f3df002df first release
dwinter
parents:
diff changeset
151 // im
fb3f3df002df first release
dwinter
parents:
diff changeset
152 // record-tag
fb3f3df002df first release
dwinter
parents:
diff changeset
153 }
fb3f3df002df first release
dwinter
parents:
diff changeset
154 }
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
155 //owlDoc.save("file:///tmp/out"+String.valueOf(signatureCount)+".owl");
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
156 //logger.debug("Saved:"+"/tmp/out"+String.valueOf(signatureCount)+".owl");
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
157 //owlDoc.reloadOWL();
0
fb3f3df002df first release
dwinter
parents:
diff changeset
158 }
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
159 owlDoc.printModel();
0
fb3f3df002df first release
dwinter
parents:
diff changeset
160 }
fb3f3df002df first release
dwinter
parents:
diff changeset
161
fb3f3df002df first release
dwinter
parents:
diff changeset
162 private OWLIndividual createEvent(Element record, OWLIndividual recordInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
163
fb3f3df002df first release
dwinter
parents:
diff changeset
164 logger.debug("Create Event");
fb3f3df002df first release
dwinter
parents:
diff changeset
165 OWLIndividual eventInstance = owlDoc.createInstance("RecordedEvent");
fb3f3df002df first release
dwinter
parents:
diff changeset
166
fb3f3df002df first release
dwinter
parents:
diff changeset
167 owlDoc.setProperty(recordInd, "crm:P70_documents", eventInstance);
fb3f3df002df first release
dwinter
parents:
diff changeset
168
fb3f3df002df first release
dwinter
parents:
diff changeset
169 // timespan
fb3f3df002df first release
dwinter
parents:
diff changeset
170
fb3f3df002df first release
dwinter
parents:
diff changeset
171 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
172 String dateDcStart = lexDoc.getValue(record, ".//datdf/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
173
fb3f3df002df first release
dwinter
parents:
diff changeset
174 String dateDcEnd = lexDoc.getValue(record, ".//datdf/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
175
fb3f3df002df first release
dwinter
parents:
diff changeset
176 if (!dateDcStart.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
177 OWLIndividual timeSpan = owlDoc.createTimeSpan(dateDcStart,
fb3f3df002df first release
dwinter
parents:
diff changeset
178 dateDcEnd);
fb3f3df002df first release
dwinter
parents:
diff changeset
179 owlDoc.setProperty(eventInstance, "crm:P4_has_time-span",
fb3f3df002df first release
dwinter
parents:
diff changeset
180 timeSpan);
fb3f3df002df first release
dwinter
parents:
diff changeset
181 }
fb3f3df002df first release
dwinter
parents:
diff changeset
182 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
183 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
184 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
185 }
fb3f3df002df first release
dwinter
parents:
diff changeset
186
fb3f3df002df first release
dwinter
parents:
diff changeset
187 // tipol
fb3f3df002df first release
dwinter
parents:
diff changeset
188 String typology;
fb3f3df002df first release
dwinter
parents:
diff changeset
189 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
190 typology = lexDoc.getValue(record, ".//tipol");
fb3f3df002df first release
dwinter
parents:
diff changeset
191 OWLIndividual typolInd = createOrGetTipol(typology);
fb3f3df002df first release
dwinter
parents:
diff changeset
192 owlDoc.setProperty(eventInstance, "has_tipol", typolInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
193
fb3f3df002df first release
dwinter
parents:
diff changeset
194 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
195 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
196 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
197 }
fb3f3df002df first release
dwinter
parents:
diff changeset
198
fb3f3df002df first release
dwinter
parents:
diff changeset
199 // reges
fb3f3df002df first release
dwinter
parents:
diff changeset
200 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
201 createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
202 ".//reges/italian", "has_reges", "it");
fb3f3df002df first release
dwinter
parents:
diff changeset
203 createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
204 ".//reges/english", "has_reges", "en");
fb3f3df002df first release
dwinter
parents:
diff changeset
205 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
206 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
207 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
208 }
fb3f3df002df first release
dwinter
parents:
diff changeset
209
fb3f3df002df first release
dwinter
parents:
diff changeset
210 // nomiq
fb3f3df002df first release
dwinter
parents:
diff changeset
211
fb3f3df002df first release
dwinter
parents:
diff changeset
212 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
213 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
214 List<Element> nomiqs = XPath.selectNodes(record, ".//nomiq");
fb3f3df002df first release
dwinter
parents:
diff changeset
215 OWLIndividual recordNamesRoles = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
216 for (Element nomiq : nomiqs) {
fb3f3df002df first release
dwinter
parents:
diff changeset
217 String name = lexDoc.getValue(nomiq, "./name");
fb3f3df002df first release
dwinter
parents:
diff changeset
218 String role = lexDoc.getValue(nomiq, "./role");
fb3f3df002df first release
dwinter
parents:
diff changeset
219
fb3f3df002df first release
dwinter
parents:
diff changeset
220 if (!name.equals("") && !role.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
221 recordNamesRoles = handleNameWithRole(recordInd, name, role);
fb3f3df002df first release
dwinter
parents:
diff changeset
222 } else if (!role.equals("")) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
223 recordNamesRoles = createOrGetRole(role);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
224 } else if (!name.equals("")) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
225 recordNamesRoles = createOrGetName(name);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
226 }
fb3f3df002df first release
dwinter
parents:
diff changeset
227
fb3f3df002df first release
dwinter
parents:
diff changeset
228 if (recordNamesRoles != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
229 owlDoc.setProperty(eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
230 "recordsDuomoObjectNameRoles", recordNamesRoles);
fb3f3df002df first release
dwinter
parents:
diff changeset
231 String id = lexDoc.getValue(nomiq, "./@id");
fb3f3df002df first release
dwinter
parents:
diff changeset
232 individualIds.put(id, recordNamesRoles);
fb3f3df002df first release
dwinter
parents:
diff changeset
233 }
fb3f3df002df first release
dwinter
parents:
diff changeset
234 }
fb3f3df002df first release
dwinter
parents:
diff changeset
235
fb3f3df002df first release
dwinter
parents:
diff changeset
236 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
237 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
238 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
239 }
fb3f3df002df first release
dwinter
parents:
diff changeset
240
fb3f3df002df first release
dwinter
parents:
diff changeset
241 // istit
fb3f3df002df first release
dwinter
parents:
diff changeset
242 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
243 String istit = lexDoc.getValue(record, "./istit");
fb3f3df002df first release
dwinter
parents:
diff changeset
244 OWLIndividual istitInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
245 "IndicesInstitutions", istit);
fb3f3df002df first release
dwinter
parents:
diff changeset
246 if (istitInd == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
247 istitInd = createOrGetInstitution(istit);
fb3f3df002df first release
dwinter
parents:
diff changeset
248 }
fb3f3df002df first release
dwinter
parents:
diff changeset
249
fb3f3df002df first release
dwinter
parents:
diff changeset
250 owlDoc.setProperty(eventInstance, "recordsDuomoObjectInstitution",
fb3f3df002df first release
dwinter
parents:
diff changeset
251 istitInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
252
fb3f3df002df first release
dwinter
parents:
diff changeset
253 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
254 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
255 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
256 }
fb3f3df002df first release
dwinter
parents:
diff changeset
257
fb3f3df002df first release
dwinter
parents:
diff changeset
258 // types
fb3f3df002df first release
dwinter
parents:
diff changeset
259
fb3f3df002df first release
dwinter
parents:
diff changeset
260 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
261 List<Element> types = XPath.selectNodes(record, ".//type");
fb3f3df002df first release
dwinter
parents:
diff changeset
262 for (Element type : types) {
fb3f3df002df first release
dwinter
parents:
diff changeset
263 createType(eventInstance, type);
fb3f3df002df first release
dwinter
parents:
diff changeset
264 }
fb3f3df002df first release
dwinter
parents:
diff changeset
265 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
266 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
267 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
268 }
fb3f3df002df first release
dwinter
parents:
diff changeset
269
fb3f3df002df first release
dwinter
parents:
diff changeset
270 return eventInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
271 }
fb3f3df002df first release
dwinter
parents:
diff changeset
272
fb3f3df002df first release
dwinter
parents:
diff changeset
273 private void createType(OWLIndividual eventInstance, Element type) {
fb3f3df002df first release
dwinter
parents:
diff changeset
274
fb3f3df002df first release
dwinter
parents:
diff changeset
275 String typeId;
fb3f3df002df first release
dwinter
parents:
diff changeset
276 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
277 typeId = lexDoc.getValue(type, "./ptr/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
278 String clsName = owlDoc.getClassNameFromTypeId(typeId);
fb3f3df002df first release
dwinter
parents:
diff changeset
279 OWLNamedClass cls = owlDoc.getClassFromTypeId(typeId);
fb3f3df002df first release
dwinter
parents:
diff changeset
280 OWLIndividual typeInd = owlDoc.createInstance(clsName);
fb3f3df002df first release
dwinter
parents:
diff changeset
281
fb3f3df002df first release
dwinter
parents:
diff changeset
282 OWLNamedClass subjectClass = getPreferredTargetClass(cls,
fb3f3df002df first release
dwinter
parents:
diff changeset
283 "has_subject");
fb3f3df002df first release
dwinter
parents:
diff changeset
284 OWLNamedClass predicateClass = getPreferredTargetClass(cls,
fb3f3df002df first release
dwinter
parents:
diff changeset
285 "has_predicate");
fb3f3df002df first release
dwinter
parents:
diff changeset
286
fb3f3df002df first release
dwinter
parents:
diff changeset
287 List<Element> freeTexts = XPath.selectNodes(type, "./freetext");
fb3f3df002df first release
dwinter
parents:
diff changeset
288 for (Element freeText : freeTexts) {
fb3f3df002df first release
dwinter
parents:
diff changeset
289
fb3f3df002df first release
dwinter
parents:
diff changeset
290 String subjPointer = lexDoc.getValue(freeText,
fb3f3df002df first release
dwinter
parents:
diff changeset
291 "./sub/ptrtoperson/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
292 String subjText = lexDoc.getValue(freeText, "./sub");
fb3f3df002df first release
dwinter
parents:
diff changeset
293
fb3f3df002df first release
dwinter
parents:
diff changeset
294 OWLIndividual subjInd = createSubjectOrPredicate(subjectClass,
fb3f3df002df first release
dwinter
parents:
diff changeset
295 subjPointer, subjText);
fb3f3df002df first release
dwinter
parents:
diff changeset
296
fb3f3df002df first release
dwinter
parents:
diff changeset
297 String predPointer = lexDoc.getValue(freeText,
fb3f3df002df first release
dwinter
parents:
diff changeset
298 "./pred/ptrtoperson/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
299 String predText = lexDoc.getValue(freeText, "./pred");
fb3f3df002df first release
dwinter
parents:
diff changeset
300
fb3f3df002df first release
dwinter
parents:
diff changeset
301 OWLIndividual predInd = createSubjectOrPredicate(
fb3f3df002df first release
dwinter
parents:
diff changeset
302 predicateClass, predPointer, predText);
fb3f3df002df first release
dwinter
parents:
diff changeset
303
fb3f3df002df first release
dwinter
parents:
diff changeset
304 if (subjInd != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
305 owlDoc.setProperty(typeInd, "has_subject", subjInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
306 }
fb3f3df002df first release
dwinter
parents:
diff changeset
307
fb3f3df002df first release
dwinter
parents:
diff changeset
308 if (predInd != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
309 owlDoc.setProperty(typeInd, "has_predicate", predInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
310 }
fb3f3df002df first release
dwinter
parents:
diff changeset
311
fb3f3df002df first release
dwinter
parents:
diff changeset
312 owlDoc.setProperty(eventInstance, "recordsDuomoObjectConcept",
fb3f3df002df first release
dwinter
parents:
diff changeset
313 typeInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
314 }
fb3f3df002df first release
dwinter
parents:
diff changeset
315
fb3f3df002df first release
dwinter
parents:
diff changeset
316 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
317 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
318 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
319 }
fb3f3df002df first release
dwinter
parents:
diff changeset
320
fb3f3df002df first release
dwinter
parents:
diff changeset
321 }
fb3f3df002df first release
dwinter
parents:
diff changeset
322
fb3f3df002df first release
dwinter
parents:
diff changeset
323 private OWLIndividual createSubjectOrPredicate(OWLNamedClass toClass,
fb3f3df002df first release
dwinter
parents:
diff changeset
324 String subjPointer, String subjText) {
fb3f3df002df first release
dwinter
parents:
diff changeset
325 OWLIndividual subjInd = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
326
fb3f3df002df first release
dwinter
parents:
diff changeset
327 if (!subjPointer.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
328 subjInd = toClass.createOWLIndividual(null);
fb3f3df002df first release
dwinter
parents:
diff changeset
329 OWLIndividual ind = individualIds.get(subjPointer);
fb3f3df002df first release
dwinter
parents:
diff changeset
330 if (ind == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
331 logger.debug("target ID does not exist:" + subjPointer);
1
dwinter
parents: 0
diff changeset
332 try {
dwinter
parents: 0
diff changeset
333 missing.write("target ID does not exist:" + subjPointer+"\n");
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
334 missing.flush();
1
dwinter
parents: 0
diff changeset
335 } catch (IOException e) {
dwinter
parents: 0
diff changeset
336 // TODO Auto-generated catch block
dwinter
parents: 0
diff changeset
337 e.printStackTrace();
dwinter
parents: 0
diff changeset
338 }
0
fb3f3df002df first release
dwinter
parents:
diff changeset
339 } else {
fb3f3df002df first release
dwinter
parents:
diff changeset
340 owlDoc.setProperty(subjInd, "has_NameOrRoleFromIndex", ind);
fb3f3df002df first release
dwinter
parents:
diff changeset
341 }
fb3f3df002df first release
dwinter
parents:
diff changeset
342 }
fb3f3df002df first release
dwinter
parents:
diff changeset
343
fb3f3df002df first release
dwinter
parents:
diff changeset
344 if (!subjText.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
345 if (subjInd == null)
fb3f3df002df first release
dwinter
parents:
diff changeset
346 subjInd = toClass.createOWLIndividual(null);
fb3f3df002df first release
dwinter
parents:
diff changeset
347
fb3f3df002df first release
dwinter
parents:
diff changeset
348 OWLNamedClass idcls = owlDoc.owlModel
fb3f3df002df first release
dwinter
parents:
diff changeset
349 .getOWLNamedClass("Identifier"); // is die klasse selbst
fb3f3df002df first release
dwinter
parents:
diff changeset
350 // schon ein identifiert
fb3f3df002df first release
dwinter
parents:
diff changeset
351 if (toClass.getNamedSuperclasses(true).contains(idcls)) { // to
fb3f3df002df first release
dwinter
parents:
diff changeset
352 owlDoc.setProperty(subjInd, "has_readable_id", subjText);
fb3f3df002df first release
dwinter
parents:
diff changeset
353 } else {
fb3f3df002df first release
dwinter
parents:
diff changeset
354
fb3f3df002df first release
dwinter
parents:
diff changeset
355 OWLIndividual ident = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
356 .createInstance("IdentifierPredicateOrSubject");
fb3f3df002df first release
dwinter
parents:
diff changeset
357 owlDoc.setProperty(ident, "has_readable_id", subjText);
fb3f3df002df first release
dwinter
parents:
diff changeset
358 owlDoc.setProperty(subjInd, "crm:P48_has_preferred_identifier",
fb3f3df002df first release
dwinter
parents:
diff changeset
359 ident);
fb3f3df002df first release
dwinter
parents:
diff changeset
360 }
fb3f3df002df first release
dwinter
parents:
diff changeset
361 }
fb3f3df002df first release
dwinter
parents:
diff changeset
362 return subjInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
363 }
fb3f3df002df first release
dwinter
parents:
diff changeset
364
fb3f3df002df first release
dwinter
parents:
diff changeset
365 private OWLNamedClass getPreferredTargetClass(OWLNamedClass cls,
fb3f3df002df first release
dwinter
parents:
diff changeset
366 String propertyName) {
fb3f3df002df first release
dwinter
parents:
diff changeset
367 RDFProperty prop = owlDoc.owlModel.getRDFProperty(propertyName);
fb3f3df002df first release
dwinter
parents:
diff changeset
368
fb3f3df002df first release
dwinter
parents:
diff changeset
369 // finde welche klasse als subject erlaubt ist
fb3f3df002df first release
dwinter
parents:
diff changeset
370 Collection<?> restrictions = cls.getRestrictions(prop, true);
fb3f3df002df first release
dwinter
parents:
diff changeset
371
fb3f3df002df first release
dwinter
parents:
diff changeset
372 RDFResource restrictionValues = prop.getRange(); // nimm erstmal den
fb3f3df002df first release
dwinter
parents:
diff changeset
373 // gesammten Range
fb3f3df002df first release
dwinter
parents:
diff changeset
374
fb3f3df002df first release
dwinter
parents:
diff changeset
375 // schaue jetzt nach ob eb es einschraenkungen gibt.
fb3f3df002df first release
dwinter
parents:
diff changeset
376 for (Iterator<?> it = restrictions.iterator(); it.hasNext();) {
fb3f3df002df first release
dwinter
parents:
diff changeset
377 Object restriction = it.next();
fb3f3df002df first release
dwinter
parents:
diff changeset
378 if (OWLAllValuesFrom.class.isInstance(restriction)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
379 OWLAllValuesFrom ar = (OWLAllValuesFrom) restriction;
fb3f3df002df first release
dwinter
parents:
diff changeset
380 restrictionValues = ar.getAllValuesFrom();
fb3f3df002df first release
dwinter
parents:
diff changeset
381 break;
fb3f3df002df first release
dwinter
parents:
diff changeset
382 }
fb3f3df002df first release
dwinter
parents:
diff changeset
383
fb3f3df002df first release
dwinter
parents:
diff changeset
384 }
fb3f3df002df first release
dwinter
parents:
diff changeset
385 OWLNamedClass toClass = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
386 if (OWLNamedClass.class.isInstance(restrictionValues)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
387 toClass = (OWLNamedClass) restrictionValues;
fb3f3df002df first release
dwinter
parents:
diff changeset
388 } else if (OWLDataRange.class.isInstance(restrictionValues)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
389 RDFList dr = ((OWLDataRange) restrictionValues).getOneOf();
fb3f3df002df first release
dwinter
parents:
diff changeset
390 for (Object d : dr.getValues()) {
fb3f3df002df first release
dwinter
parents:
diff changeset
391 System.out.println(d);
fb3f3df002df first release
dwinter
parents:
diff changeset
392 toClass = (OWLNamedClass) d;
fb3f3df002df first release
dwinter
parents:
diff changeset
393 // FIXME: geht das??
fb3f3df002df first release
dwinter
parents:
diff changeset
394 }
fb3f3df002df first release
dwinter
parents:
diff changeset
395 } else if (DefaultOWLUnionClass.class.isInstance(restrictionValues)) { // mehr
fb3f3df002df first release
dwinter
parents:
diff changeset
396 // als
fb3f3df002df first release
dwinter
parents:
diff changeset
397 // eine
fb3f3df002df first release
dwinter
parents:
diff changeset
398 // moeglich
fb3f3df002df first release
dwinter
parents:
diff changeset
399 DefaultOWLUnionClass ou = (DefaultOWLUnionClass) restrictionValues;
fb3f3df002df first release
dwinter
parents:
diff changeset
400 Set set = new HashSet();
fb3f3df002df first release
dwinter
parents:
diff changeset
401 ou.getNestedNamedClasses(set);
fb3f3df002df first release
dwinter
parents:
diff changeset
402
fb3f3df002df first release
dwinter
parents:
diff changeset
403 for (Iterator<?> it = set.iterator(); it.hasNext();) {
fb3f3df002df first release
dwinter
parents:
diff changeset
404 OWLNamedClass cl = (OWLNamedClass) it.next();
fb3f3df002df first release
dwinter
parents:
diff changeset
405 OWLNamedClass idcls = owlDoc.owlModel
fb3f3df002df first release
dwinter
parents:
diff changeset
406 .getOWLNamedClass("Identifier"); // nimm die Klasse die
fb3f3df002df first release
dwinter
parents:
diff changeset
407 // ein Identifier
fb3f3df002df first release
dwinter
parents:
diff changeset
408 // ist.
fb3f3df002df first release
dwinter
parents:
diff changeset
409 if (cl.getNamedSuperclasses(true).contains(idcls)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
410 toClass = cl;
fb3f3df002df first release
dwinter
parents:
diff changeset
411 break;
fb3f3df002df first release
dwinter
parents:
diff changeset
412 }
fb3f3df002df first release
dwinter
parents:
diff changeset
413
fb3f3df002df first release
dwinter
parents:
diff changeset
414 }
fb3f3df002df first release
dwinter
parents:
diff changeset
415 }
fb3f3df002df first release
dwinter
parents:
diff changeset
416 return toClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
417 }
fb3f3df002df first release
dwinter
parents:
diff changeset
418
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
419
0
fb3f3df002df first release
dwinter
parents:
diff changeset
420
fb3f3df002df first release
dwinter
parents:
diff changeset
421 private OWLIndividual handleNameWithRole(OWLIndividual recordInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
422 String name, String role) {
fb3f3df002df first release
dwinter
parents:
diff changeset
423 // teste ob schon ein solcer Eintrag existiert
fb3f3df002df first release
dwinter
parents:
diff changeset
424 OWLIndividual nameInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
425 "IndicesNames", name);
fb3f3df002df first release
dwinter
parents:
diff changeset
426 Boolean createNewNameWithRole = false;
fb3f3df002df first release
dwinter
parents:
diff changeset
427 if (nameInd == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
428 nameInd = createOrGetName(name);
fb3f3df002df first release
dwinter
parents:
diff changeset
429 createNewNameWithRole = true; // name existierte nicht dann kann
fb3f3df002df first release
dwinter
parents:
diff changeset
430 // auch NameWithRole nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
431 // existierten.
fb3f3df002df first release
dwinter
parents:
diff changeset
432 }
fb3f3df002df first release
dwinter
parents:
diff changeset
433 OWLIndividual roleInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
434 "IndicesRoles", role);
fb3f3df002df first release
dwinter
parents:
diff changeset
435 if (roleInd == null) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
436 roleInd = createOrGetRole(role);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
437 createNewNameWithRole = true; // role existierte nicht dann kann
fb3f3df002df first release
dwinter
parents:
diff changeset
438 // auch NameWithRole nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
439 // existierten.
fb3f3df002df first release
dwinter
parents:
diff changeset
440 }
fb3f3df002df first release
dwinter
parents:
diff changeset
441 OWLIndividual nameWithRoleInd = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
442 if (!createNewNameWithRole) { // schon klar, dass er nicht existiert
fb3f3df002df first release
dwinter
parents:
diff changeset
443 nameWithRoleInd = getNameWithRole(nameInd, roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
444 }
fb3f3df002df first release
dwinter
parents:
diff changeset
445
fb3f3df002df first release
dwinter
parents:
diff changeset
446 if (nameWithRoleInd == null) { // existiert nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
447 nameWithRoleInd = createNameWithRole(nameInd, roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
448 }
fb3f3df002df first release
dwinter
parents:
diff changeset
449
fb3f3df002df first release
dwinter
parents:
diff changeset
450 return nameWithRoleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
451 }
fb3f3df002df first release
dwinter
parents:
diff changeset
452
fb3f3df002df first release
dwinter
parents:
diff changeset
453 private OWLIndividual getNameWithRole(OWLIndividual nameInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
454 OWLIndividual roleInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
455 List<OWLIndividual> indicesWithNames = owlDoc.getIndividuals(
fb3f3df002df first release
dwinter
parents:
diff changeset
456 "IndicesNameWithRole", "refers_to_name", nameInd); // suche alle
fb3f3df002df first release
dwinter
parents:
diff changeset
457 // infrage
fb3f3df002df first release
dwinter
parents:
diff changeset
458 // kommenden
fb3f3df002df first release
dwinter
parents:
diff changeset
459 // nameen
fb3f3df002df first release
dwinter
parents:
diff changeset
460
fb3f3df002df first release
dwinter
parents:
diff changeset
461 if (indicesWithNames == null) { // kein Treffer
fb3f3df002df first release
dwinter
parents:
diff changeset
462 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
463 }
fb3f3df002df first release
dwinter
parents:
diff changeset
464
fb3f3df002df first release
dwinter
parents:
diff changeset
465 for (OWLIndividual name : indicesWithNames) {
fb3f3df002df first release
dwinter
parents:
diff changeset
466 Object role = owlDoc.getRelatedIndividual(name, "refers_to_role");
fb3f3df002df first release
dwinter
parents:
diff changeset
467 if (roleInd.equals(role)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
468 return name;
fb3f3df002df first release
dwinter
parents:
diff changeset
469 }
fb3f3df002df first release
dwinter
parents:
diff changeset
470 }
fb3f3df002df first release
dwinter
parents:
diff changeset
471 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
472 }
fb3f3df002df first release
dwinter
parents:
diff changeset
473
fb3f3df002df first release
dwinter
parents:
diff changeset
474 private OWLIndividual createOrGetTipol(String typology) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
475 OWLIndividual tipol = owlDoc.createOrGetInstanceWithIdentifier("Typology","Identifier",typology,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
476 return tipol;
fb3f3df002df first release
dwinter
parents:
diff changeset
477 }
fb3f3df002df first release
dwinter
parents:
diff changeset
478
fb3f3df002df first release
dwinter
parents:
diff changeset
479 private OWLIndividual createNameWithRole(OWLIndividual nameInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
480 OWLIndividual roleInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
481
fb3f3df002df first release
dwinter
parents:
diff changeset
482 OWLIndividual nameWithRoleInd = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
483 .createInstance("IndicesNameWithRole");
fb3f3df002df first release
dwinter
parents:
diff changeset
484
fb3f3df002df first release
dwinter
parents:
diff changeset
485 owlDoc.setProperty(nameWithRoleInd, "refers_to_name", nameInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
486 owlDoc.setProperty(nameWithRoleInd, "refers_to_role", roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
487
fb3f3df002df first release
dwinter
parents:
diff changeset
488 return nameWithRoleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
489
fb3f3df002df first release
dwinter
parents:
diff changeset
490 }
fb3f3df002df first release
dwinter
parents:
diff changeset
491
fb3f3df002df first release
dwinter
parents:
diff changeset
492 private OWLIndividual createOrGetInstitution(String name) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
493 OWLIndividual nameInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesInstitutions","IdentifierInstitutions",name,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
494
fb3f3df002df first release
dwinter
parents:
diff changeset
495 return nameInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
496 }
fb3f3df002df first release
dwinter
parents:
diff changeset
497
fb3f3df002df first release
dwinter
parents:
diff changeset
498 private OWLIndividual createOrGetName(String name) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
499 OWLIndividual nameInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesNames","IdentifierNames",name,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
500 return nameInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
501 }
fb3f3df002df first release
dwinter
parents:
diff changeset
502
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
503 private OWLIndividual createOrGetRole(String name) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
504 OWLIndividual roleInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesRoles","IdentifierRoles",name,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
505 return roleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
506 }
fb3f3df002df first release
dwinter
parents:
diff changeset
507
fb3f3df002df first release
dwinter
parents:
diff changeset
508 private OWLIndividual createRecord(Element record, OWLIndividual cardInd)
fb3f3df002df first release
dwinter
parents:
diff changeset
509 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
510 OWLIndividual recordInstance = owlDoc.createInstance("Record");
fb3f3df002df first release
dwinter
parents:
diff changeset
511 owlDoc.setProperty(recordInstance, "is_on_card", cardInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
512 createNewDependingInstanceFromXpath(record, recordInstance, "./@id",
fb3f3df002df first release
dwinter
parents:
diff changeset
513 new String[] { "has_readable_id", "rdfs:label" },
fb3f3df002df first release
dwinter
parents:
diff changeset
514 "IdentifierCurrent", "crm:P48_has_preferred_identifier");
fb3f3df002df first release
dwinter
parents:
diff changeset
515
fb3f3df002df first release
dwinter
parents:
diff changeset
516 String value = lexDoc.getValue(record, ".//textblockid");
fb3f3df002df first release
dwinter
parents:
diff changeset
517 if (!value.equals(""))
fb3f3df002df first release
dwinter
parents:
diff changeset
518 owlDoc.setProperty(recordInstance, "has_textblockid", value);
fb3f3df002df first release
dwinter
parents:
diff changeset
519
fb3f3df002df first release
dwinter
parents:
diff changeset
520 String endOnCarta = lexDoc.getValue(record, "./@end_on_carta");
fb3f3df002df first release
dwinter
parents:
diff changeset
521 if (!endOnCarta.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
522 OWLIndividual signature = (OWLIndividual) owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
523 .getRelatedIndividual(cardInd, "has_signature");
fb3f3df002df first release
dwinter
parents:
diff changeset
524 addRecordToCarta(recordInstance, value, signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
525 }
fb3f3df002df first release
dwinter
parents:
diff changeset
526
fb3f3df002df first release
dwinter
parents:
diff changeset
527 String dateDcStart = lexDoc.getValue(record, ".//datdc/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
528 String dateDcEnd = lexDoc.getValue(record, ".//datdc/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
529
fb3f3df002df first release
dwinter
parents:
diff changeset
530 OWLIndividual timeSpan = owlDoc.createTimeSpan(dateDcStart, dateDcEnd);
fb3f3df002df first release
dwinter
parents:
diff changeset
531
fb3f3df002df first release
dwinter
parents:
diff changeset
532 owlDoc.setProperty(recordInstance, "crm:P4_has_time-span", timeSpan);
fb3f3df002df first release
dwinter
parents:
diff changeset
533
fb3f3df002df first release
dwinter
parents:
diff changeset
534 return recordInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
535 }
fb3f3df002df first release
dwinter
parents:
diff changeset
536
fb3f3df002df first release
dwinter
parents:
diff changeset
537 private void addRecordToCarta(OWLIndividual recordInstance, String cardID,
fb3f3df002df first release
dwinter
parents:
diff changeset
538 OWLIndividual signature) {
fb3f3df002df first release
dwinter
parents:
diff changeset
539
fb3f3df002df first release
dwinter
parents:
diff changeset
540 OWLIndividual card = owlDoc.getIndividualByReadableId("Card", cardID);
fb3f3df002df first release
dwinter
parents:
diff changeset
541
fb3f3df002df first release
dwinter
parents:
diff changeset
542 if (card == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
543 card = createCard(cardID, signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
544 }
fb3f3df002df first release
dwinter
parents:
diff changeset
545
fb3f3df002df first release
dwinter
parents:
diff changeset
546 owlDoc.setProperty(recordInstance, "is_on_card", card);
fb3f3df002df first release
dwinter
parents:
diff changeset
547 }
fb3f3df002df first release
dwinter
parents:
diff changeset
548
fb3f3df002df first release
dwinter
parents:
diff changeset
549 private OWLIndividual createSignature(Element signature)
fb3f3df002df first release
dwinter
parents:
diff changeset
550 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
551 Element segHeaderElement = (Element) XPath.selectSingleNode(signature,
fb3f3df002df first release
dwinter
parents:
diff changeset
552 ".//segheader");
fb3f3df002df first release
dwinter
parents:
diff changeset
553 String segheader = segHeaderElement.getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
554
fb3f3df002df first release
dwinter
parents:
diff changeset
555 OWLIndividual signatureInstance = owlDoc.createInstance("Signatur");
fb3f3df002df first release
dwinter
parents:
diff changeset
556 owlDoc.setProperty(signatureInstance, "rdfs:label", segheader);
fb3f3df002df first release
dwinter
parents:
diff changeset
557 return signatureInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
558 }
fb3f3df002df first release
dwinter
parents:
diff changeset
559
fb3f3df002df first release
dwinter
parents:
diff changeset
560 private OWLIndividual createCard(String cardId, OWLIndividual signature) {
fb3f3df002df first release
dwinter
parents:
diff changeset
561
fb3f3df002df first release
dwinter
parents:
diff changeset
562 OWLIndividual cardInstance = owlDoc.createInstance("Card");
fb3f3df002df first release
dwinter
parents:
diff changeset
563
fb3f3df002df first release
dwinter
parents:
diff changeset
564 owlDoc.setProperty(cardInstance, "has_signature", signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
565
fb3f3df002df first release
dwinter
parents:
diff changeset
566 OWLIndividual preferredId = owlDoc.createInstance("IdentifierCurrent");
fb3f3df002df first release
dwinter
parents:
diff changeset
567 owlDoc.setProperty(preferredId, "has_readable_id", cardId);
fb3f3df002df first release
dwinter
parents:
diff changeset
568 owlDoc.setProperty(preferredId, "rdfs:label", cardId);
fb3f3df002df first release
dwinter
parents:
diff changeset
569
fb3f3df002df first release
dwinter
parents:
diff changeset
570 owlDoc.setProperty(cardInstance, "crm:P48_has_preferred_identifier",
fb3f3df002df first release
dwinter
parents:
diff changeset
571 preferredId);
fb3f3df002df first release
dwinter
parents:
diff changeset
572
fb3f3df002df first release
dwinter
parents:
diff changeset
573 return cardInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
574 }
fb3f3df002df first release
dwinter
parents:
diff changeset
575
fb3f3df002df first release
dwinter
parents:
diff changeset
576 private OWLIndividual createCard(Element card, OWLIndividual signatureInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
577
fb3f3df002df first release
dwinter
parents:
diff changeset
578 OWLIndividual cardInstance = owlDoc.createInstance("Card");
fb3f3df002df first release
dwinter
parents:
diff changeset
579
fb3f3df002df first release
dwinter
parents:
diff changeset
580 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
581
fb3f3df002df first release
dwinter
parents:
diff changeset
582 createNewDependingInstanceFromXpath(card, cardInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
583 ".//cartanr", new String[] { "has_readable_id",
fb3f3df002df first release
dwinter
parents:
diff changeset
584 "rdfs:label" }, "IdentifierCurrent",
fb3f3df002df first release
dwinter
parents:
diff changeset
585 "crm:P48_has_preferred_identifier");
fb3f3df002df first release
dwinter
parents:
diff changeset
586
fb3f3df002df first release
dwinter
parents:
diff changeset
587 createNewDependingInstanceFromXpath(card, cardInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
588 ".//cartaant", new String[] { "has_readable_id",
fb3f3df002df first release
dwinter
parents:
diff changeset
589 "rdfs:label" }, "IdentifierCurrent",
fb3f3df002df first release
dwinter
parents:
diff changeset
590 "crm:P1_is_identified_by");
fb3f3df002df first release
dwinter
parents:
diff changeset
591
fb3f3df002df first release
dwinter
parents:
diff changeset
592 owlDoc.setProperty(cardInstance, "has_signature", signatureInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
593
fb3f3df002df first release
dwinter
parents:
diff changeset
594 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
595 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
596 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
597 }
fb3f3df002df first release
dwinter
parents:
diff changeset
598
fb3f3df002df first release
dwinter
parents:
diff changeset
599 return cardInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
600 }
fb3f3df002df first release
dwinter
parents:
diff changeset
601
fb3f3df002df first release
dwinter
parents:
diff changeset
602 private void createNewDependingInstanceFromXpath(Element card,
fb3f3df002df first release
dwinter
parents:
diff changeset
603 OWLIndividual cardInstance, String xpath, String[] propertyNames,
fb3f3df002df first release
dwinter
parents:
diff changeset
604 String newInstanceClassName, String relationNameToNewInstance)
fb3f3df002df first release
dwinter
parents:
diff changeset
605 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
606
fb3f3df002df first release
dwinter
parents:
diff changeset
607 List<?> identifierIdEls = (List<?>) XPath.selectNodes(card, xpath);
fb3f3df002df first release
dwinter
parents:
diff changeset
608 for (Object identifierIdEl : identifierIdEls) {
fb3f3df002df first release
dwinter
parents:
diff changeset
609 String identifierId = "";
fb3f3df002df first release
dwinter
parents:
diff changeset
610 if (Element.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
611 identifierId = ((Element) identifierIdEl).getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
612 } else if (Attribute.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
613 identifierId = ((Attribute) identifierIdEl).getValue();
fb3f3df002df first release
dwinter
parents:
diff changeset
614 }
fb3f3df002df first release
dwinter
parents:
diff changeset
615
fb3f3df002df first release
dwinter
parents:
diff changeset
616 OWLIndividual identifier = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
617 .createInstance(newInstanceClassName);
fb3f3df002df first release
dwinter
parents:
diff changeset
618 for (int i = 0; i < propertyNames.length; i++) {
fb3f3df002df first release
dwinter
parents:
diff changeset
619 owlDoc.setProperty(identifier, propertyNames[i], identifierId);
fb3f3df002df first release
dwinter
parents:
diff changeset
620 }
fb3f3df002df first release
dwinter
parents:
diff changeset
621
fb3f3df002df first release
dwinter
parents:
diff changeset
622 owlDoc.setProperty(cardInstance, relationNameToNewInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
623 identifier);
fb3f3df002df first release
dwinter
parents:
diff changeset
624 }
fb3f3df002df first release
dwinter
parents:
diff changeset
625
fb3f3df002df first release
dwinter
parents:
diff changeset
626 }
fb3f3df002df first release
dwinter
parents:
diff changeset
627
fb3f3df002df first release
dwinter
parents:
diff changeset
628 // createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
629 // ".//resges/italian", "has_reges",
fb3f3df002df first release
dwinter
parents:
diff changeset
630 // "italian");
fb3f3df002df first release
dwinter
parents:
diff changeset
631 private void createNewDependingDataTypePropertyFromXpath(Element record,
fb3f3df002df first release
dwinter
parents:
diff changeset
632 OWLIndividual eventInstance, String xpath, String propertyName,
fb3f3df002df first release
dwinter
parents:
diff changeset
633 String lang) throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
634
fb3f3df002df first release
dwinter
parents:
diff changeset
635 List<?> identifierIdEls = (List<?>) XPath.selectNodes(record, xpath);
fb3f3df002df first release
dwinter
parents:
diff changeset
636 for (Object identifierIdEl : identifierIdEls) {
fb3f3df002df first release
dwinter
parents:
diff changeset
637 String identifierId = "";
fb3f3df002df first release
dwinter
parents:
diff changeset
638 if (Element.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
639 identifierId = ((Element) identifierIdEl).getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
640 } else if (Attribute.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
641 identifierId = ((Attribute) identifierIdEl).getValue();
fb3f3df002df first release
dwinter
parents:
diff changeset
642 }
fb3f3df002df first release
dwinter
parents:
diff changeset
643
fb3f3df002df first release
dwinter
parents:
diff changeset
644 owlDoc.setDataTypePropery(eventInstance, propertyName,
fb3f3df002df first release
dwinter
parents:
diff changeset
645 identifierId, lang);
fb3f3df002df first release
dwinter
parents:
diff changeset
646 }
fb3f3df002df first release
dwinter
parents:
diff changeset
647 }
fb3f3df002df first release
dwinter
parents:
diff changeset
648 }