annotate src/de/mpiwg/dwinter/duomo/lexdump/LexOWLTransformer.java @ 2:273164f81926

bug in transformer handleroles
author dwinter
date Thu, 03 Feb 2011 16:08:06 +0100
parents 0fa29ab5e5e0
children d9fd32ecae24
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
fb3f3df002df first release
dwinter
parents:
diff changeset
1 package de.mpiwg.dwinter.duomo.lexdump;
fb3f3df002df first release
dwinter
parents:
diff changeset
2
1
dwinter
parents: 0
diff changeset
3 import java.io.File;
dwinter
parents: 0
diff changeset
4 import java.io.FileWriter;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
5 import java.io.IOException;
fb3f3df002df first release
dwinter
parents:
diff changeset
6 import java.net.URI;
fb3f3df002df first release
dwinter
parents:
diff changeset
7 import java.net.URISyntaxException;
fb3f3df002df first release
dwinter
parents:
diff changeset
8 import java.net.URLEncoder;
fb3f3df002df first release
dwinter
parents:
diff changeset
9 import java.util.Collection;
fb3f3df002df first release
dwinter
parents:
diff changeset
10 import java.util.HashMap;
fb3f3df002df first release
dwinter
parents:
diff changeset
11 import java.util.HashSet;
fb3f3df002df first release
dwinter
parents:
diff changeset
12 import java.util.Iterator;
fb3f3df002df first release
dwinter
parents:
diff changeset
13 import java.util.List;
fb3f3df002df first release
dwinter
parents:
diff changeset
14 import java.util.Map;
fb3f3df002df first release
dwinter
parents:
diff changeset
15 import java.util.Set;
fb3f3df002df first release
dwinter
parents:
diff changeset
16
fb3f3df002df first release
dwinter
parents:
diff changeset
17 import javax.print.URIException;
fb3f3df002df first release
dwinter
parents:
diff changeset
18
fb3f3df002df first release
dwinter
parents:
diff changeset
19 import org.apache.log4j.Level;
fb3f3df002df first release
dwinter
parents:
diff changeset
20 import org.apache.log4j.Logger;
fb3f3df002df first release
dwinter
parents:
diff changeset
21 import org.jdom.Attribute;
fb3f3df002df first release
dwinter
parents:
diff changeset
22 import org.jdom.Element;
fb3f3df002df first release
dwinter
parents:
diff changeset
23 import org.jdom.JDOMException;
fb3f3df002df first release
dwinter
parents:
diff changeset
24 import org.jdom.xpath.XPath;
fb3f3df002df first release
dwinter
parents:
diff changeset
25
fb3f3df002df first release
dwinter
parents:
diff changeset
26 import com.sun.xml.internal.ws.developer.MemberSubmissionEndpointReference.Elements;
fb3f3df002df first release
dwinter
parents:
diff changeset
27
fb3f3df002df first release
dwinter
parents:
diff changeset
28 import edu.stanford.smi.protege.exception.OntologyLoadException;
fb3f3df002df first release
dwinter
parents:
diff changeset
29 import edu.stanford.smi.protege.model.Instance;
fb3f3df002df first release
dwinter
parents:
diff changeset
30 import edu.stanford.smi.protegex.owl.model.OWLAllValuesFrom;
fb3f3df002df first release
dwinter
parents:
diff changeset
31 import edu.stanford.smi.protegex.owl.model.OWLClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
32 import edu.stanford.smi.protegex.owl.model.OWLDataRange;
fb3f3df002df first release
dwinter
parents:
diff changeset
33 import edu.stanford.smi.protegex.owl.model.OWLIndividual;
fb3f3df002df first release
dwinter
parents:
diff changeset
34 import edu.stanford.smi.protegex.owl.model.OWLNamedClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
35 import edu.stanford.smi.protegex.owl.model.OWLProperty;
fb3f3df002df first release
dwinter
parents:
diff changeset
36 import edu.stanford.smi.protegex.owl.model.OWLUnionClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
37 import edu.stanford.smi.protegex.owl.model.RDFList;
fb3f3df002df first release
dwinter
parents:
diff changeset
38 import edu.stanford.smi.protegex.owl.model.RDFProperty;
fb3f3df002df first release
dwinter
parents:
diff changeset
39 import edu.stanford.smi.protegex.owl.model.RDFResource;
fb3f3df002df first release
dwinter
parents:
diff changeset
40 import edu.stanford.smi.protegex.owl.model.impl.AbstractOWLQuantifierRestriction;
fb3f3df002df first release
dwinter
parents:
diff changeset
41 import edu.stanford.smi.protegex.owl.model.impl.DefaultOWLUnionClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
42
fb3f3df002df first release
dwinter
parents:
diff changeset
43 public class LexOWLTransformer {
fb3f3df002df first release
dwinter
parents:
diff changeset
44 private Logger logger = Logger.getRootLogger();
1
dwinter
parents: 0
diff changeset
45 private FileWriter missing;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
46 private OWLImporter owlDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
47 private LexDumpImporter lexDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
48 private Map<String, OWLIndividual> individualIds = new HashMap<String, OWLIndividual>(); // speichere
fb3f3df002df first release
dwinter
parents:
diff changeset
49 // ids
fb3f3df002df first release
dwinter
parents:
diff changeset
50 // fuer
fb3f3df002df first release
dwinter
parents:
diff changeset
51 // weitere
fb3f3df002df first release
dwinter
parents:
diff changeset
52 // Verwendung
fb3f3df002df first release
dwinter
parents:
diff changeset
53
1
dwinter
parents: 0
diff changeset
54 public LexOWLTransformer(OWLImporter owlDoc, LexDumpImporter lexDoc) throws IOException {
0
fb3f3df002df first release
dwinter
parents:
diff changeset
55 this.owlDoc = owlDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
56 this.lexDoc = lexDoc;
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
57 missing = new FileWriter(new File("/tmp/missing.out"));
0
fb3f3df002df first release
dwinter
parents:
diff changeset
58 }
fb3f3df002df first release
dwinter
parents:
diff changeset
59
fb3f3df002df first release
dwinter
parents:
diff changeset
60 /**
fb3f3df002df first release
dwinter
parents:
diff changeset
61 * @param args
fb3f3df002df first release
dwinter
parents:
diff changeset
62 * @throws Exception
fb3f3df002df first release
dwinter
parents:
diff changeset
63 */
fb3f3df002df first release
dwinter
parents:
diff changeset
64 public static void main(String[] args) throws Exception {
fb3f3df002df first release
dwinter
parents:
diff changeset
65 Logger.getRootLogger().setLevel(Level.DEBUG);
fb3f3df002df first release
dwinter
parents:
diff changeset
66 // Import OWL
fb3f3df002df first release
dwinter
parents:
diff changeset
67 //String base = "/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput";
fb3f3df002df first release
dwinter
parents:
diff changeset
68 String base=args[0];
fb3f3df002df first release
dwinter
parents:
diff changeset
69 String baseUri= base.replace(" ", "%20");
fb3f3df002df first release
dwinter
parents:
diff changeset
70 URI ontologieUri = new URI("file://"+baseUri+"/duomoAnalysis.owl");
fb3f3df002df first release
dwinter
parents:
diff changeset
71 //URI ontologieUri = new URI(
fb3f3df002df first release
dwinter
parents:
diff changeset
72 // "file:///Users/dwinter/Documents/Projekte/Diss%20-%20data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput/duomoAnalysis.owl");
fb3f3df002df first release
dwinter
parents:
diff changeset
73 OWLImporter owlDoc = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
74 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
75
fb3f3df002df first release
dwinter
parents:
diff changeset
76 owlDoc = new OWLImporter(base, ontologieUri);
fb3f3df002df first release
dwinter
parents:
diff changeset
77 // owlDoc.printModel();
fb3f3df002df first release
dwinter
parents:
diff changeset
78 } catch (OntologyLoadException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
79 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
80 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
81 }
fb3f3df002df first release
dwinter
parents:
diff changeset
82 // read and parse lexfile
fb3f3df002df first release
dwinter
parents:
diff changeset
83 //String lexFile = "/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/duomoData/LEXXDUMP.xml";
fb3f3df002df first release
dwinter
parents:
diff changeset
84 String lexFile=args[1];
fb3f3df002df first release
dwinter
parents:
diff changeset
85 LexDumpImporter lexDoc = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
86 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
87 lexDoc = new LexDumpImporter(lexFile);
fb3f3df002df first release
dwinter
parents:
diff changeset
88 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
89 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
90 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
91 } catch (IOException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
92 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
93 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
94 }
fb3f3df002df first release
dwinter
parents:
diff changeset
95
fb3f3df002df first release
dwinter
parents:
diff changeset
96 // List<Element> cartas = lexDoc.getCartas();
fb3f3df002df first release
dwinter
parents:
diff changeset
97 // System.out.println(cartas.size());
fb3f3df002df first release
dwinter
parents:
diff changeset
98
fb3f3df002df first release
dwinter
parents:
diff changeset
99 LexOWLTransformer tf = new LexOWLTransformer(owlDoc, lexDoc);
fb3f3df002df first release
dwinter
parents:
diff changeset
100 tf.transform();
fb3f3df002df first release
dwinter
parents:
diff changeset
101 owlDoc.save("file:///tmp/out.owl");
fb3f3df002df first release
dwinter
parents:
diff changeset
102 }
fb3f3df002df first release
dwinter
parents:
diff changeset
103
fb3f3df002df first release
dwinter
parents:
diff changeset
104 private void transform() throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
105 List<Element> signatures = lexDoc.getSignatures();
fb3f3df002df first release
dwinter
parents:
diff changeset
106
fb3f3df002df first release
dwinter
parents:
diff changeset
107 // Element signature = signatures.get(0);
fb3f3df002df first release
dwinter
parents:
diff changeset
108 int signatureCount = 1;
fb3f3df002df first release
dwinter
parents:
diff changeset
109 int maxsign = signatures.size();
fb3f3df002df first release
dwinter
parents:
diff changeset
110 for (Element signature : signatures) {
fb3f3df002df first release
dwinter
parents:
diff changeset
111 logger.debug(String.format("Signature: %s (%s)", signatureCount,
fb3f3df002df first release
dwinter
parents:
diff changeset
112 maxsign));
fb3f3df002df first release
dwinter
parents:
diff changeset
113 OWLIndividual signatureInd = createSignature(signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
114
fb3f3df002df first release
dwinter
parents:
diff changeset
115 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
116 List<Element> cards = XPath.selectNodes(signature, ".//carta");
fb3f3df002df first release
dwinter
parents:
diff changeset
117 int cardsCount = 1;
fb3f3df002df first release
dwinter
parents:
diff changeset
118 int maxcards = cards.size();
fb3f3df002df first release
dwinter
parents:
diff changeset
119
fb3f3df002df first release
dwinter
parents:
diff changeset
120 // Element card=cards.get(0);
fb3f3df002df first release
dwinter
parents:
diff changeset
121 for (Element card : cards) {
fb3f3df002df first release
dwinter
parents:
diff changeset
122 logger.debug(String.format("Cards: %s (%s)", cardsCount++,
fb3f3df002df first release
dwinter
parents:
diff changeset
123 maxcards));
fb3f3df002df first release
dwinter
parents:
diff changeset
124 logger.debug(String.format("Signature: %s (%s)",
fb3f3df002df first release
dwinter
parents:
diff changeset
125 signatureCount, maxsign));
fb3f3df002df first release
dwinter
parents:
diff changeset
126 OWLIndividual cardInd = createCard(card, signatureInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
127
fb3f3df002df first release
dwinter
parents:
diff changeset
128 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
129 List<Element> records = XPath.selectNodes(card, ".//record");
fb3f3df002df first release
dwinter
parents:
diff changeset
130 for (Element record : records) {
fb3f3df002df first release
dwinter
parents:
diff changeset
131 // Element record = records.get(0);
fb3f3df002df first release
dwinter
parents:
diff changeset
132 OWLIndividual recordInd = createRecord(record, cardInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
133 OWLIndividual recordEvent = createEvent(record, recordInd); // Event
fb3f3df002df first release
dwinter
parents:
diff changeset
134 // und
fb3f3df002df first release
dwinter
parents:
diff changeset
135 // Records
fb3f3df002df first release
dwinter
parents:
diff changeset
136 // sind
fb3f3df002df first release
dwinter
parents:
diff changeset
137 // im
fb3f3df002df first release
dwinter
parents:
diff changeset
138 // Original
fb3f3df002df first release
dwinter
parents:
diff changeset
139 // im
fb3f3df002df first release
dwinter
parents:
diff changeset
140 // record-tag
fb3f3df002df first release
dwinter
parents:
diff changeset
141 }
fb3f3df002df first release
dwinter
parents:
diff changeset
142 }
fb3f3df002df first release
dwinter
parents:
diff changeset
143 signatureCount++;
fb3f3df002df first release
dwinter
parents:
diff changeset
144 }
fb3f3df002df first release
dwinter
parents:
diff changeset
145 owlDoc.printModel();
fb3f3df002df first release
dwinter
parents:
diff changeset
146 }
fb3f3df002df first release
dwinter
parents:
diff changeset
147
fb3f3df002df first release
dwinter
parents:
diff changeset
148 private OWLIndividual createEvent(Element record, OWLIndividual recordInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
149
fb3f3df002df first release
dwinter
parents:
diff changeset
150 logger.debug("Create Event");
fb3f3df002df first release
dwinter
parents:
diff changeset
151 OWLIndividual eventInstance = owlDoc.createInstance("RecordedEvent");
fb3f3df002df first release
dwinter
parents:
diff changeset
152
fb3f3df002df first release
dwinter
parents:
diff changeset
153 owlDoc.setProperty(recordInd, "crm:P70_documents", eventInstance);
fb3f3df002df first release
dwinter
parents:
diff changeset
154
fb3f3df002df first release
dwinter
parents:
diff changeset
155 // timespan
fb3f3df002df first release
dwinter
parents:
diff changeset
156
fb3f3df002df first release
dwinter
parents:
diff changeset
157 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
158 String dateDcStart = lexDoc.getValue(record, ".//datdf/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
159
fb3f3df002df first release
dwinter
parents:
diff changeset
160 String dateDcEnd = lexDoc.getValue(record, ".//datdf/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
161
fb3f3df002df first release
dwinter
parents:
diff changeset
162 if (!dateDcStart.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
163 OWLIndividual timeSpan = owlDoc.createTimeSpan(dateDcStart,
fb3f3df002df first release
dwinter
parents:
diff changeset
164 dateDcEnd);
fb3f3df002df first release
dwinter
parents:
diff changeset
165 owlDoc.setProperty(eventInstance, "crm:P4_has_time-span",
fb3f3df002df first release
dwinter
parents:
diff changeset
166 timeSpan);
fb3f3df002df first release
dwinter
parents:
diff changeset
167 }
fb3f3df002df first release
dwinter
parents:
diff changeset
168 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
169 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
170 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
171 }
fb3f3df002df first release
dwinter
parents:
diff changeset
172
fb3f3df002df first release
dwinter
parents:
diff changeset
173 // tipol
fb3f3df002df first release
dwinter
parents:
diff changeset
174 String typology;
fb3f3df002df first release
dwinter
parents:
diff changeset
175 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
176 typology = lexDoc.getValue(record, ".//tipol");
fb3f3df002df first release
dwinter
parents:
diff changeset
177 OWLIndividual typolInd = createOrGetTipol(typology);
fb3f3df002df first release
dwinter
parents:
diff changeset
178 owlDoc.setProperty(eventInstance, "has_tipol", typolInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
179
fb3f3df002df first release
dwinter
parents:
diff changeset
180 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
181 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
182 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
183 }
fb3f3df002df first release
dwinter
parents:
diff changeset
184
fb3f3df002df first release
dwinter
parents:
diff changeset
185 // reges
fb3f3df002df first release
dwinter
parents:
diff changeset
186 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
187 createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
188 ".//reges/italian", "has_reges", "it");
fb3f3df002df first release
dwinter
parents:
diff changeset
189 createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
190 ".//reges/english", "has_reges", "en");
fb3f3df002df first release
dwinter
parents:
diff changeset
191 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
192 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
193 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
194 }
fb3f3df002df first release
dwinter
parents:
diff changeset
195
fb3f3df002df first release
dwinter
parents:
diff changeset
196 // nomiq
fb3f3df002df first release
dwinter
parents:
diff changeset
197
fb3f3df002df first release
dwinter
parents:
diff changeset
198 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
199 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
200 List<Element> nomiqs = XPath.selectNodes(record, ".//nomiq");
fb3f3df002df first release
dwinter
parents:
diff changeset
201 OWLIndividual recordNamesRoles = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
202 for (Element nomiq : nomiqs) {
fb3f3df002df first release
dwinter
parents:
diff changeset
203 String name = lexDoc.getValue(nomiq, "./name");
fb3f3df002df first release
dwinter
parents:
diff changeset
204 String role = lexDoc.getValue(nomiq, "./role");
fb3f3df002df first release
dwinter
parents:
diff changeset
205
fb3f3df002df first release
dwinter
parents:
diff changeset
206 if (!name.equals("") && !role.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
207 recordNamesRoles = handleNameWithRole(recordInd, name, role);
fb3f3df002df first release
dwinter
parents:
diff changeset
208 } else if (!role.equals("")) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
209 recordNamesRoles = createOrGetRole(role);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
210 } else if (!name.equals("")) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
211 recordNamesRoles = createOrGetName(name);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
212 }
fb3f3df002df first release
dwinter
parents:
diff changeset
213
fb3f3df002df first release
dwinter
parents:
diff changeset
214 if (recordNamesRoles != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
215 owlDoc.setProperty(eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
216 "recordsDuomoObjectNameRoles", recordNamesRoles);
fb3f3df002df first release
dwinter
parents:
diff changeset
217 String id = lexDoc.getValue(nomiq, "./@id");
fb3f3df002df first release
dwinter
parents:
diff changeset
218 individualIds.put(id, recordNamesRoles);
fb3f3df002df first release
dwinter
parents:
diff changeset
219 }
fb3f3df002df first release
dwinter
parents:
diff changeset
220 }
fb3f3df002df first release
dwinter
parents:
diff changeset
221
fb3f3df002df first release
dwinter
parents:
diff changeset
222 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
223 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
224 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
225 }
fb3f3df002df first release
dwinter
parents:
diff changeset
226
fb3f3df002df first release
dwinter
parents:
diff changeset
227 // istit
fb3f3df002df first release
dwinter
parents:
diff changeset
228 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
229 String istit = lexDoc.getValue(record, "./istit");
fb3f3df002df first release
dwinter
parents:
diff changeset
230 OWLIndividual istitInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
231 "IndicesInstitutions", istit);
fb3f3df002df first release
dwinter
parents:
diff changeset
232 if (istitInd == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
233 istitInd = createOrGetInstitution(istit);
fb3f3df002df first release
dwinter
parents:
diff changeset
234 }
fb3f3df002df first release
dwinter
parents:
diff changeset
235
fb3f3df002df first release
dwinter
parents:
diff changeset
236 owlDoc.setProperty(eventInstance, "recordsDuomoObjectInstitution",
fb3f3df002df first release
dwinter
parents:
diff changeset
237 istitInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
238
fb3f3df002df first release
dwinter
parents:
diff changeset
239 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
240 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
241 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
242 }
fb3f3df002df first release
dwinter
parents:
diff changeset
243
fb3f3df002df first release
dwinter
parents:
diff changeset
244 // types
fb3f3df002df first release
dwinter
parents:
diff changeset
245
fb3f3df002df first release
dwinter
parents:
diff changeset
246 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
247 List<Element> types = XPath.selectNodes(record, ".//type");
fb3f3df002df first release
dwinter
parents:
diff changeset
248 for (Element type : types) {
fb3f3df002df first release
dwinter
parents:
diff changeset
249 createType(eventInstance, type);
fb3f3df002df first release
dwinter
parents:
diff changeset
250 }
fb3f3df002df first release
dwinter
parents:
diff changeset
251 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
252 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
253 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
254 }
fb3f3df002df first release
dwinter
parents:
diff changeset
255
fb3f3df002df first release
dwinter
parents:
diff changeset
256 return eventInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
257 }
fb3f3df002df first release
dwinter
parents:
diff changeset
258
fb3f3df002df first release
dwinter
parents:
diff changeset
259 private void createType(OWLIndividual eventInstance, Element type) {
fb3f3df002df first release
dwinter
parents:
diff changeset
260
fb3f3df002df first release
dwinter
parents:
diff changeset
261 String typeId;
fb3f3df002df first release
dwinter
parents:
diff changeset
262 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
263 typeId = lexDoc.getValue(type, "./ptr/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
264 String clsName = owlDoc.getClassNameFromTypeId(typeId);
fb3f3df002df first release
dwinter
parents:
diff changeset
265 OWLNamedClass cls = owlDoc.getClassFromTypeId(typeId);
fb3f3df002df first release
dwinter
parents:
diff changeset
266 OWLIndividual typeInd = owlDoc.createInstance(clsName);
fb3f3df002df first release
dwinter
parents:
diff changeset
267
fb3f3df002df first release
dwinter
parents:
diff changeset
268 OWLNamedClass subjectClass = getPreferredTargetClass(cls,
fb3f3df002df first release
dwinter
parents:
diff changeset
269 "has_subject");
fb3f3df002df first release
dwinter
parents:
diff changeset
270 OWLNamedClass predicateClass = getPreferredTargetClass(cls,
fb3f3df002df first release
dwinter
parents:
diff changeset
271 "has_predicate");
fb3f3df002df first release
dwinter
parents:
diff changeset
272
fb3f3df002df first release
dwinter
parents:
diff changeset
273 List<Element> freeTexts = XPath.selectNodes(type, "./freetext");
fb3f3df002df first release
dwinter
parents:
diff changeset
274 for (Element freeText : freeTexts) {
fb3f3df002df first release
dwinter
parents:
diff changeset
275
fb3f3df002df first release
dwinter
parents:
diff changeset
276 String subjPointer = lexDoc.getValue(freeText,
fb3f3df002df first release
dwinter
parents:
diff changeset
277 "./sub/ptrtoperson/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
278 String subjText = lexDoc.getValue(freeText, "./sub");
fb3f3df002df first release
dwinter
parents:
diff changeset
279
fb3f3df002df first release
dwinter
parents:
diff changeset
280 OWLIndividual subjInd = createSubjectOrPredicate(subjectClass,
fb3f3df002df first release
dwinter
parents:
diff changeset
281 subjPointer, subjText);
fb3f3df002df first release
dwinter
parents:
diff changeset
282
fb3f3df002df first release
dwinter
parents:
diff changeset
283 String predPointer = lexDoc.getValue(freeText,
fb3f3df002df first release
dwinter
parents:
diff changeset
284 "./pred/ptrtoperson/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
285 String predText = lexDoc.getValue(freeText, "./pred");
fb3f3df002df first release
dwinter
parents:
diff changeset
286
fb3f3df002df first release
dwinter
parents:
diff changeset
287 OWLIndividual predInd = createSubjectOrPredicate(
fb3f3df002df first release
dwinter
parents:
diff changeset
288 predicateClass, predPointer, predText);
fb3f3df002df first release
dwinter
parents:
diff changeset
289
fb3f3df002df first release
dwinter
parents:
diff changeset
290 if (subjInd != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
291 owlDoc.setProperty(typeInd, "has_subject", subjInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
292 }
fb3f3df002df first release
dwinter
parents:
diff changeset
293
fb3f3df002df first release
dwinter
parents:
diff changeset
294 if (predInd != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
295 owlDoc.setProperty(typeInd, "has_predicate", predInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
296 }
fb3f3df002df first release
dwinter
parents:
diff changeset
297
fb3f3df002df first release
dwinter
parents:
diff changeset
298 owlDoc.setProperty(eventInstance, "recordsDuomoObjectConcept",
fb3f3df002df first release
dwinter
parents:
diff changeset
299 typeInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
300 }
fb3f3df002df first release
dwinter
parents:
diff changeset
301
fb3f3df002df first release
dwinter
parents:
diff changeset
302 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
303 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
304 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
305 }
fb3f3df002df first release
dwinter
parents:
diff changeset
306
fb3f3df002df first release
dwinter
parents:
diff changeset
307 }
fb3f3df002df first release
dwinter
parents:
diff changeset
308
fb3f3df002df first release
dwinter
parents:
diff changeset
309 private OWLIndividual createSubjectOrPredicate(OWLNamedClass toClass,
fb3f3df002df first release
dwinter
parents:
diff changeset
310 String subjPointer, String subjText) {
fb3f3df002df first release
dwinter
parents:
diff changeset
311 OWLIndividual subjInd = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
312
fb3f3df002df first release
dwinter
parents:
diff changeset
313 if (!subjPointer.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
314 subjInd = toClass.createOWLIndividual(null);
fb3f3df002df first release
dwinter
parents:
diff changeset
315 OWLIndividual ind = individualIds.get(subjPointer);
fb3f3df002df first release
dwinter
parents:
diff changeset
316 if (ind == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
317 logger.debug("target ID does not exist:" + subjPointer);
1
dwinter
parents: 0
diff changeset
318 try {
dwinter
parents: 0
diff changeset
319 missing.write("target ID does not exist:" + subjPointer+"\n");
dwinter
parents: 0
diff changeset
320 } catch (IOException e) {
dwinter
parents: 0
diff changeset
321 // TODO Auto-generated catch block
dwinter
parents: 0
diff changeset
322 e.printStackTrace();
dwinter
parents: 0
diff changeset
323 }
0
fb3f3df002df first release
dwinter
parents:
diff changeset
324 } else {
fb3f3df002df first release
dwinter
parents:
diff changeset
325 owlDoc.setProperty(subjInd, "has_NameOrRoleFromIndex", ind);
fb3f3df002df first release
dwinter
parents:
diff changeset
326 }
fb3f3df002df first release
dwinter
parents:
diff changeset
327 }
fb3f3df002df first release
dwinter
parents:
diff changeset
328
fb3f3df002df first release
dwinter
parents:
diff changeset
329 if (!subjText.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
330 if (subjInd == null)
fb3f3df002df first release
dwinter
parents:
diff changeset
331 subjInd = toClass.createOWLIndividual(null);
fb3f3df002df first release
dwinter
parents:
diff changeset
332
fb3f3df002df first release
dwinter
parents:
diff changeset
333 OWLNamedClass idcls = owlDoc.owlModel
fb3f3df002df first release
dwinter
parents:
diff changeset
334 .getOWLNamedClass("Identifier"); // is die klasse selbst
fb3f3df002df first release
dwinter
parents:
diff changeset
335 // schon ein identifiert
fb3f3df002df first release
dwinter
parents:
diff changeset
336 if (toClass.getNamedSuperclasses(true).contains(idcls)) { // to
fb3f3df002df first release
dwinter
parents:
diff changeset
337 owlDoc.setProperty(subjInd, "has_readable_id", subjText);
fb3f3df002df first release
dwinter
parents:
diff changeset
338 } else {
fb3f3df002df first release
dwinter
parents:
diff changeset
339
fb3f3df002df first release
dwinter
parents:
diff changeset
340 OWLIndividual ident = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
341 .createInstance("IdentifierPredicateOrSubject");
fb3f3df002df first release
dwinter
parents:
diff changeset
342 owlDoc.setProperty(ident, "has_readable_id", subjText);
fb3f3df002df first release
dwinter
parents:
diff changeset
343 owlDoc.setProperty(subjInd, "crm:P48_has_preferred_identifier",
fb3f3df002df first release
dwinter
parents:
diff changeset
344 ident);
fb3f3df002df first release
dwinter
parents:
diff changeset
345 }
fb3f3df002df first release
dwinter
parents:
diff changeset
346 }
fb3f3df002df first release
dwinter
parents:
diff changeset
347 return subjInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
348 }
fb3f3df002df first release
dwinter
parents:
diff changeset
349
fb3f3df002df first release
dwinter
parents:
diff changeset
350 private OWLNamedClass getPreferredTargetClass(OWLNamedClass cls,
fb3f3df002df first release
dwinter
parents:
diff changeset
351 String propertyName) {
fb3f3df002df first release
dwinter
parents:
diff changeset
352 RDFProperty prop = owlDoc.owlModel.getRDFProperty(propertyName);
fb3f3df002df first release
dwinter
parents:
diff changeset
353
fb3f3df002df first release
dwinter
parents:
diff changeset
354 // finde welche klasse als subject erlaubt ist
fb3f3df002df first release
dwinter
parents:
diff changeset
355 Collection<?> restrictions = cls.getRestrictions(prop, true);
fb3f3df002df first release
dwinter
parents:
diff changeset
356
fb3f3df002df first release
dwinter
parents:
diff changeset
357 RDFResource restrictionValues = prop.getRange(); // nimm erstmal den
fb3f3df002df first release
dwinter
parents:
diff changeset
358 // gesammten Range
fb3f3df002df first release
dwinter
parents:
diff changeset
359
fb3f3df002df first release
dwinter
parents:
diff changeset
360 // schaue jetzt nach ob eb es einschraenkungen gibt.
fb3f3df002df first release
dwinter
parents:
diff changeset
361 for (Iterator<?> it = restrictions.iterator(); it.hasNext();) {
fb3f3df002df first release
dwinter
parents:
diff changeset
362 Object restriction = it.next();
fb3f3df002df first release
dwinter
parents:
diff changeset
363 if (OWLAllValuesFrom.class.isInstance(restriction)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
364 OWLAllValuesFrom ar = (OWLAllValuesFrom) restriction;
fb3f3df002df first release
dwinter
parents:
diff changeset
365 restrictionValues = ar.getAllValuesFrom();
fb3f3df002df first release
dwinter
parents:
diff changeset
366 break;
fb3f3df002df first release
dwinter
parents:
diff changeset
367 }
fb3f3df002df first release
dwinter
parents:
diff changeset
368
fb3f3df002df first release
dwinter
parents:
diff changeset
369 }
fb3f3df002df first release
dwinter
parents:
diff changeset
370 OWLNamedClass toClass = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
371 if (OWLNamedClass.class.isInstance(restrictionValues)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
372 toClass = (OWLNamedClass) restrictionValues;
fb3f3df002df first release
dwinter
parents:
diff changeset
373 } else if (OWLDataRange.class.isInstance(restrictionValues)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
374 RDFList dr = ((OWLDataRange) restrictionValues).getOneOf();
fb3f3df002df first release
dwinter
parents:
diff changeset
375 for (Object d : dr.getValues()) {
fb3f3df002df first release
dwinter
parents:
diff changeset
376 System.out.println(d);
fb3f3df002df first release
dwinter
parents:
diff changeset
377 toClass = (OWLNamedClass) d;
fb3f3df002df first release
dwinter
parents:
diff changeset
378 // FIXME: geht das??
fb3f3df002df first release
dwinter
parents:
diff changeset
379 }
fb3f3df002df first release
dwinter
parents:
diff changeset
380 } else if (DefaultOWLUnionClass.class.isInstance(restrictionValues)) { // mehr
fb3f3df002df first release
dwinter
parents:
diff changeset
381 // als
fb3f3df002df first release
dwinter
parents:
diff changeset
382 // eine
fb3f3df002df first release
dwinter
parents:
diff changeset
383 // moeglich
fb3f3df002df first release
dwinter
parents:
diff changeset
384 DefaultOWLUnionClass ou = (DefaultOWLUnionClass) restrictionValues;
fb3f3df002df first release
dwinter
parents:
diff changeset
385 Set set = new HashSet();
fb3f3df002df first release
dwinter
parents:
diff changeset
386 ou.getNestedNamedClasses(set);
fb3f3df002df first release
dwinter
parents:
diff changeset
387
fb3f3df002df first release
dwinter
parents:
diff changeset
388 for (Iterator<?> it = set.iterator(); it.hasNext();) {
fb3f3df002df first release
dwinter
parents:
diff changeset
389 OWLNamedClass cl = (OWLNamedClass) it.next();
fb3f3df002df first release
dwinter
parents:
diff changeset
390 OWLNamedClass idcls = owlDoc.owlModel
fb3f3df002df first release
dwinter
parents:
diff changeset
391 .getOWLNamedClass("Identifier"); // nimm die Klasse die
fb3f3df002df first release
dwinter
parents:
diff changeset
392 // ein Identifier
fb3f3df002df first release
dwinter
parents:
diff changeset
393 // ist.
fb3f3df002df first release
dwinter
parents:
diff changeset
394 if (cl.getNamedSuperclasses(true).contains(idcls)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
395 toClass = cl;
fb3f3df002df first release
dwinter
parents:
diff changeset
396 break;
fb3f3df002df first release
dwinter
parents:
diff changeset
397 }
fb3f3df002df first release
dwinter
parents:
diff changeset
398
fb3f3df002df first release
dwinter
parents:
diff changeset
399 }
fb3f3df002df first release
dwinter
parents:
diff changeset
400 }
fb3f3df002df first release
dwinter
parents:
diff changeset
401 return toClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
402 }
fb3f3df002df first release
dwinter
parents:
diff changeset
403
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
404
0
fb3f3df002df first release
dwinter
parents:
diff changeset
405
fb3f3df002df first release
dwinter
parents:
diff changeset
406 private OWLIndividual handleNameWithRole(OWLIndividual recordInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
407 String name, String role) {
fb3f3df002df first release
dwinter
parents:
diff changeset
408 // teste ob schon ein solcer Eintrag existiert
fb3f3df002df first release
dwinter
parents:
diff changeset
409 OWLIndividual nameInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
410 "IndicesNames", name);
fb3f3df002df first release
dwinter
parents:
diff changeset
411 Boolean createNewNameWithRole = false;
fb3f3df002df first release
dwinter
parents:
diff changeset
412 if (nameInd == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
413 nameInd = createOrGetName(name);
fb3f3df002df first release
dwinter
parents:
diff changeset
414 createNewNameWithRole = true; // name existierte nicht dann kann
fb3f3df002df first release
dwinter
parents:
diff changeset
415 // auch NameWithRole nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
416 // existierten.
fb3f3df002df first release
dwinter
parents:
diff changeset
417 }
fb3f3df002df first release
dwinter
parents:
diff changeset
418 OWLIndividual roleInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
419 "IndicesRoles", role);
fb3f3df002df first release
dwinter
parents:
diff changeset
420 if (roleInd == null) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
421 roleInd = createOrGetRole(role);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
422 createNewNameWithRole = true; // role existierte nicht dann kann
fb3f3df002df first release
dwinter
parents:
diff changeset
423 // auch NameWithRole nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
424 // existierten.
fb3f3df002df first release
dwinter
parents:
diff changeset
425 }
fb3f3df002df first release
dwinter
parents:
diff changeset
426 OWLIndividual nameWithRoleInd = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
427 if (!createNewNameWithRole) { // schon klar, dass er nicht existiert
fb3f3df002df first release
dwinter
parents:
diff changeset
428 nameWithRoleInd = getNameWithRole(nameInd, roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
429 }
fb3f3df002df first release
dwinter
parents:
diff changeset
430
fb3f3df002df first release
dwinter
parents:
diff changeset
431 if (nameWithRoleInd == null) { // existiert nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
432 nameWithRoleInd = createNameWithRole(nameInd, roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
433 }
fb3f3df002df first release
dwinter
parents:
diff changeset
434
fb3f3df002df first release
dwinter
parents:
diff changeset
435 return nameWithRoleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
436 }
fb3f3df002df first release
dwinter
parents:
diff changeset
437
fb3f3df002df first release
dwinter
parents:
diff changeset
438 private OWLIndividual getNameWithRole(OWLIndividual nameInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
439 OWLIndividual roleInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
440 List<OWLIndividual> indicesWithNames = owlDoc.getIndividuals(
fb3f3df002df first release
dwinter
parents:
diff changeset
441 "IndicesNameWithRole", "refers_to_name", nameInd); // suche alle
fb3f3df002df first release
dwinter
parents:
diff changeset
442 // infrage
fb3f3df002df first release
dwinter
parents:
diff changeset
443 // kommenden
fb3f3df002df first release
dwinter
parents:
diff changeset
444 // nameen
fb3f3df002df first release
dwinter
parents:
diff changeset
445
fb3f3df002df first release
dwinter
parents:
diff changeset
446 if (indicesWithNames == null) { // kein Treffer
fb3f3df002df first release
dwinter
parents:
diff changeset
447 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
448 }
fb3f3df002df first release
dwinter
parents:
diff changeset
449
fb3f3df002df first release
dwinter
parents:
diff changeset
450 for (OWLIndividual name : indicesWithNames) {
fb3f3df002df first release
dwinter
parents:
diff changeset
451 Object role = owlDoc.getRelatedIndividual(name, "refers_to_role");
fb3f3df002df first release
dwinter
parents:
diff changeset
452 if (roleInd.equals(role)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
453 return name;
fb3f3df002df first release
dwinter
parents:
diff changeset
454 }
fb3f3df002df first release
dwinter
parents:
diff changeset
455 }
fb3f3df002df first release
dwinter
parents:
diff changeset
456 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
457 }
fb3f3df002df first release
dwinter
parents:
diff changeset
458
fb3f3df002df first release
dwinter
parents:
diff changeset
459 private OWLIndividual createOrGetTipol(String typology) {
fb3f3df002df first release
dwinter
parents:
diff changeset
460 OWLIndividual tipol = owlDoc.createOrGetInstanceWithIdentifier("Typology","Identifier",typology);
fb3f3df002df first release
dwinter
parents:
diff changeset
461 return tipol;
fb3f3df002df first release
dwinter
parents:
diff changeset
462 }
fb3f3df002df first release
dwinter
parents:
diff changeset
463
fb3f3df002df first release
dwinter
parents:
diff changeset
464 private OWLIndividual createNameWithRole(OWLIndividual nameInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
465 OWLIndividual roleInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
466
fb3f3df002df first release
dwinter
parents:
diff changeset
467 OWLIndividual nameWithRoleInd = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
468 .createInstance("IndicesNameWithRole");
fb3f3df002df first release
dwinter
parents:
diff changeset
469
fb3f3df002df first release
dwinter
parents:
diff changeset
470 owlDoc.setProperty(nameWithRoleInd, "refers_to_name", nameInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
471 owlDoc.setProperty(nameWithRoleInd, "refers_to_role", roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
472
fb3f3df002df first release
dwinter
parents:
diff changeset
473 return nameWithRoleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
474
fb3f3df002df first release
dwinter
parents:
diff changeset
475 }
fb3f3df002df first release
dwinter
parents:
diff changeset
476
fb3f3df002df first release
dwinter
parents:
diff changeset
477 private OWLIndividual createOrGetInstitution(String name) {
fb3f3df002df first release
dwinter
parents:
diff changeset
478 OWLIndividual nameInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesInstitutions","IdentifierInstitutions",name);
fb3f3df002df first release
dwinter
parents:
diff changeset
479
fb3f3df002df first release
dwinter
parents:
diff changeset
480 return nameInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
481 }
fb3f3df002df first release
dwinter
parents:
diff changeset
482
fb3f3df002df first release
dwinter
parents:
diff changeset
483 private OWLIndividual createOrGetName(String name) {
fb3f3df002df first release
dwinter
parents:
diff changeset
484 OWLIndividual nameInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesNames","IdentifierNames",name);
fb3f3df002df first release
dwinter
parents:
diff changeset
485 return nameInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
486 }
fb3f3df002df first release
dwinter
parents:
diff changeset
487
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
488 private OWLIndividual createOrGetRole(String name) {
0
fb3f3df002df first release
dwinter
parents:
diff changeset
489 OWLIndividual roleInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesRoles","IdentifierRoles",name);
fb3f3df002df first release
dwinter
parents:
diff changeset
490 return roleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
491 }
fb3f3df002df first release
dwinter
parents:
diff changeset
492
fb3f3df002df first release
dwinter
parents:
diff changeset
493 private OWLIndividual createRecord(Element record, OWLIndividual cardInd)
fb3f3df002df first release
dwinter
parents:
diff changeset
494 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
495 OWLIndividual recordInstance = owlDoc.createInstance("Record");
fb3f3df002df first release
dwinter
parents:
diff changeset
496 owlDoc.setProperty(recordInstance, "is_on_card", cardInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
497 createNewDependingInstanceFromXpath(record, recordInstance, "./@id",
fb3f3df002df first release
dwinter
parents:
diff changeset
498 new String[] { "has_readable_id", "rdfs:label" },
fb3f3df002df first release
dwinter
parents:
diff changeset
499 "IdentifierCurrent", "crm:P48_has_preferred_identifier");
fb3f3df002df first release
dwinter
parents:
diff changeset
500
fb3f3df002df first release
dwinter
parents:
diff changeset
501 String value = lexDoc.getValue(record, ".//textblockid");
fb3f3df002df first release
dwinter
parents:
diff changeset
502 if (!value.equals(""))
fb3f3df002df first release
dwinter
parents:
diff changeset
503 owlDoc.setProperty(recordInstance, "has_textblockid", value);
fb3f3df002df first release
dwinter
parents:
diff changeset
504
fb3f3df002df first release
dwinter
parents:
diff changeset
505 String endOnCarta = lexDoc.getValue(record, "./@end_on_carta");
fb3f3df002df first release
dwinter
parents:
diff changeset
506 if (!endOnCarta.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
507 OWLIndividual signature = (OWLIndividual) owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
508 .getRelatedIndividual(cardInd, "has_signature");
fb3f3df002df first release
dwinter
parents:
diff changeset
509 addRecordToCarta(recordInstance, value, signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
510 }
fb3f3df002df first release
dwinter
parents:
diff changeset
511
fb3f3df002df first release
dwinter
parents:
diff changeset
512 String dateDcStart = lexDoc.getValue(record, ".//datdc/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
513 String dateDcEnd = lexDoc.getValue(record, ".//datdc/startdate");
fb3f3df002df first release
dwinter
parents:
diff changeset
514
fb3f3df002df first release
dwinter
parents:
diff changeset
515 OWLIndividual timeSpan = owlDoc.createTimeSpan(dateDcStart, dateDcEnd);
fb3f3df002df first release
dwinter
parents:
diff changeset
516
fb3f3df002df first release
dwinter
parents:
diff changeset
517 owlDoc.setProperty(recordInstance, "crm:P4_has_time-span", timeSpan);
fb3f3df002df first release
dwinter
parents:
diff changeset
518
fb3f3df002df first release
dwinter
parents:
diff changeset
519 return recordInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
520 }
fb3f3df002df first release
dwinter
parents:
diff changeset
521
fb3f3df002df first release
dwinter
parents:
diff changeset
522 private void addRecordToCarta(OWLIndividual recordInstance, String cardID,
fb3f3df002df first release
dwinter
parents:
diff changeset
523 OWLIndividual signature) {
fb3f3df002df first release
dwinter
parents:
diff changeset
524
fb3f3df002df first release
dwinter
parents:
diff changeset
525 OWLIndividual card = owlDoc.getIndividualByReadableId("Card", cardID);
fb3f3df002df first release
dwinter
parents:
diff changeset
526
fb3f3df002df first release
dwinter
parents:
diff changeset
527 if (card == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
528 card = createCard(cardID, signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
529 }
fb3f3df002df first release
dwinter
parents:
diff changeset
530
fb3f3df002df first release
dwinter
parents:
diff changeset
531 owlDoc.setProperty(recordInstance, "is_on_card", card);
fb3f3df002df first release
dwinter
parents:
diff changeset
532 }
fb3f3df002df first release
dwinter
parents:
diff changeset
533
fb3f3df002df first release
dwinter
parents:
diff changeset
534 private OWLIndividual createSignature(Element signature)
fb3f3df002df first release
dwinter
parents:
diff changeset
535 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
536 Element segHeaderElement = (Element) XPath.selectSingleNode(signature,
fb3f3df002df first release
dwinter
parents:
diff changeset
537 ".//segheader");
fb3f3df002df first release
dwinter
parents:
diff changeset
538 String segheader = segHeaderElement.getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
539
fb3f3df002df first release
dwinter
parents:
diff changeset
540 OWLIndividual signatureInstance = owlDoc.createInstance("Signatur");
fb3f3df002df first release
dwinter
parents:
diff changeset
541 owlDoc.setProperty(signatureInstance, "rdfs:label", segheader);
fb3f3df002df first release
dwinter
parents:
diff changeset
542 return signatureInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
543 }
fb3f3df002df first release
dwinter
parents:
diff changeset
544
fb3f3df002df first release
dwinter
parents:
diff changeset
545 private OWLIndividual createCard(String cardId, OWLIndividual signature) {
fb3f3df002df first release
dwinter
parents:
diff changeset
546
fb3f3df002df first release
dwinter
parents:
diff changeset
547 OWLIndividual cardInstance = owlDoc.createInstance("Card");
fb3f3df002df first release
dwinter
parents:
diff changeset
548
fb3f3df002df first release
dwinter
parents:
diff changeset
549 owlDoc.setProperty(cardInstance, "has_signature", signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
550
fb3f3df002df first release
dwinter
parents:
diff changeset
551 OWLIndividual preferredId = owlDoc.createInstance("IdentifierCurrent");
fb3f3df002df first release
dwinter
parents:
diff changeset
552 owlDoc.setProperty(preferredId, "has_readable_id", cardId);
fb3f3df002df first release
dwinter
parents:
diff changeset
553 owlDoc.setProperty(preferredId, "rdfs:label", cardId);
fb3f3df002df first release
dwinter
parents:
diff changeset
554
fb3f3df002df first release
dwinter
parents:
diff changeset
555 owlDoc.setProperty(cardInstance, "crm:P48_has_preferred_identifier",
fb3f3df002df first release
dwinter
parents:
diff changeset
556 preferredId);
fb3f3df002df first release
dwinter
parents:
diff changeset
557
fb3f3df002df first release
dwinter
parents:
diff changeset
558 return cardInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
559 }
fb3f3df002df first release
dwinter
parents:
diff changeset
560
fb3f3df002df first release
dwinter
parents:
diff changeset
561 private OWLIndividual createCard(Element card, OWLIndividual signatureInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
562
fb3f3df002df first release
dwinter
parents:
diff changeset
563 OWLIndividual cardInstance = owlDoc.createInstance("Card");
fb3f3df002df first release
dwinter
parents:
diff changeset
564
fb3f3df002df first release
dwinter
parents:
diff changeset
565 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
566
fb3f3df002df first release
dwinter
parents:
diff changeset
567 createNewDependingInstanceFromXpath(card, cardInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
568 ".//cartanr", new String[] { "has_readable_id",
fb3f3df002df first release
dwinter
parents:
diff changeset
569 "rdfs:label" }, "IdentifierCurrent",
fb3f3df002df first release
dwinter
parents:
diff changeset
570 "crm:P48_has_preferred_identifier");
fb3f3df002df first release
dwinter
parents:
diff changeset
571
fb3f3df002df first release
dwinter
parents:
diff changeset
572 createNewDependingInstanceFromXpath(card, cardInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
573 ".//cartaant", new String[] { "has_readable_id",
fb3f3df002df first release
dwinter
parents:
diff changeset
574 "rdfs:label" }, "IdentifierCurrent",
fb3f3df002df first release
dwinter
parents:
diff changeset
575 "crm:P1_is_identified_by");
fb3f3df002df first release
dwinter
parents:
diff changeset
576
fb3f3df002df first release
dwinter
parents:
diff changeset
577 owlDoc.setProperty(cardInstance, "has_signature", signatureInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
578
fb3f3df002df first release
dwinter
parents:
diff changeset
579 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
580 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
581 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
582 }
fb3f3df002df first release
dwinter
parents:
diff changeset
583
fb3f3df002df first release
dwinter
parents:
diff changeset
584 return cardInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
585 }
fb3f3df002df first release
dwinter
parents:
diff changeset
586
fb3f3df002df first release
dwinter
parents:
diff changeset
587 private void createNewDependingInstanceFromXpath(Element card,
fb3f3df002df first release
dwinter
parents:
diff changeset
588 OWLIndividual cardInstance, String xpath, String[] propertyNames,
fb3f3df002df first release
dwinter
parents:
diff changeset
589 String newInstanceClassName, String relationNameToNewInstance)
fb3f3df002df first release
dwinter
parents:
diff changeset
590 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
591
fb3f3df002df first release
dwinter
parents:
diff changeset
592 List<?> identifierIdEls = (List<?>) XPath.selectNodes(card, xpath);
fb3f3df002df first release
dwinter
parents:
diff changeset
593 for (Object identifierIdEl : identifierIdEls) {
fb3f3df002df first release
dwinter
parents:
diff changeset
594 String identifierId = "";
fb3f3df002df first release
dwinter
parents:
diff changeset
595 if (Element.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
596 identifierId = ((Element) identifierIdEl).getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
597 } else if (Attribute.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
598 identifierId = ((Attribute) identifierIdEl).getValue();
fb3f3df002df first release
dwinter
parents:
diff changeset
599 }
fb3f3df002df first release
dwinter
parents:
diff changeset
600
fb3f3df002df first release
dwinter
parents:
diff changeset
601 OWLIndividual identifier = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
602 .createInstance(newInstanceClassName);
fb3f3df002df first release
dwinter
parents:
diff changeset
603 for (int i = 0; i < propertyNames.length; i++) {
fb3f3df002df first release
dwinter
parents:
diff changeset
604 owlDoc.setProperty(identifier, propertyNames[i], identifierId);
fb3f3df002df first release
dwinter
parents:
diff changeset
605 }
fb3f3df002df first release
dwinter
parents:
diff changeset
606
fb3f3df002df first release
dwinter
parents:
diff changeset
607 owlDoc.setProperty(cardInstance, relationNameToNewInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
608 identifier);
fb3f3df002df first release
dwinter
parents:
diff changeset
609 }
fb3f3df002df first release
dwinter
parents:
diff changeset
610
fb3f3df002df first release
dwinter
parents:
diff changeset
611 }
fb3f3df002df first release
dwinter
parents:
diff changeset
612
fb3f3df002df first release
dwinter
parents:
diff changeset
613 // createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
614 // ".//resges/italian", "has_reges",
fb3f3df002df first release
dwinter
parents:
diff changeset
615 // "italian");
fb3f3df002df first release
dwinter
parents:
diff changeset
616 private void createNewDependingDataTypePropertyFromXpath(Element record,
fb3f3df002df first release
dwinter
parents:
diff changeset
617 OWLIndividual eventInstance, String xpath, String propertyName,
fb3f3df002df first release
dwinter
parents:
diff changeset
618 String lang) throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
619
fb3f3df002df first release
dwinter
parents:
diff changeset
620 List<?> identifierIdEls = (List<?>) XPath.selectNodes(record, xpath);
fb3f3df002df first release
dwinter
parents:
diff changeset
621 for (Object identifierIdEl : identifierIdEls) {
fb3f3df002df first release
dwinter
parents:
diff changeset
622 String identifierId = "";
fb3f3df002df first release
dwinter
parents:
diff changeset
623 if (Element.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
624 identifierId = ((Element) identifierIdEl).getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
625 } else if (Attribute.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
626 identifierId = ((Attribute) identifierIdEl).getValue();
fb3f3df002df first release
dwinter
parents:
diff changeset
627 }
fb3f3df002df first release
dwinter
parents:
diff changeset
628
fb3f3df002df first release
dwinter
parents:
diff changeset
629 owlDoc.setDataTypePropery(eventInstance, propertyName,
fb3f3df002df first release
dwinter
parents:
diff changeset
630 identifierId, lang);
fb3f3df002df first release
dwinter
parents:
diff changeset
631 }
fb3f3df002df first release
dwinter
parents:
diff changeset
632 }
fb3f3df002df first release
dwinter
parents:
diff changeset
633 }