annotate src/de/mpiwg/dwinter/duomo/lexdump/LexOWLTransformer.java @ 9:4392a6adf85a default tip

new version der label mit language tag
author dwinter
date Thu, 16 Aug 2012 11:40:17 +0200
parents 919e9f3b5efd
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
fb3f3df002df first release
dwinter
parents:
diff changeset
1 package de.mpiwg.dwinter.duomo.lexdump;
fb3f3df002df first release
dwinter
parents:
diff changeset
2
1
dwinter
parents: 0
diff changeset
3 import java.io.File;
dwinter
parents: 0
diff changeset
4 import java.io.FileWriter;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
5 import java.io.IOException;
fb3f3df002df first release
dwinter
parents:
diff changeset
6 import java.net.URI;
fb3f3df002df first release
dwinter
parents:
diff changeset
7 import java.net.URISyntaxException;
fb3f3df002df first release
dwinter
parents:
diff changeset
8 import java.net.URLEncoder;
fb3f3df002df first release
dwinter
parents:
diff changeset
9 import java.util.Collection;
fb3f3df002df first release
dwinter
parents:
diff changeset
10 import java.util.HashMap;
fb3f3df002df first release
dwinter
parents:
diff changeset
11 import java.util.HashSet;
fb3f3df002df first release
dwinter
parents:
diff changeset
12 import java.util.Iterator;
fb3f3df002df first release
dwinter
parents:
diff changeset
13 import java.util.List;
fb3f3df002df first release
dwinter
parents:
diff changeset
14 import java.util.Map;
fb3f3df002df first release
dwinter
parents:
diff changeset
15 import java.util.Set;
fb3f3df002df first release
dwinter
parents:
diff changeset
16
fb3f3df002df first release
dwinter
parents:
diff changeset
17 import javax.print.URIException;
fb3f3df002df first release
dwinter
parents:
diff changeset
18
fb3f3df002df first release
dwinter
parents:
diff changeset
19 import org.apache.log4j.Level;
fb3f3df002df first release
dwinter
parents:
diff changeset
20 import org.apache.log4j.Logger;
fb3f3df002df first release
dwinter
parents:
diff changeset
21 import org.jdom.Attribute;
fb3f3df002df first release
dwinter
parents:
diff changeset
22 import org.jdom.Element;
fb3f3df002df first release
dwinter
parents:
diff changeset
23 import org.jdom.JDOMException;
fb3f3df002df first release
dwinter
parents:
diff changeset
24 import org.jdom.xpath.XPath;
fb3f3df002df first release
dwinter
parents:
diff changeset
25
fb3f3df002df first release
dwinter
parents:
diff changeset
26 import com.sun.xml.internal.ws.developer.MemberSubmissionEndpointReference.Elements;
fb3f3df002df first release
dwinter
parents:
diff changeset
27
fb3f3df002df first release
dwinter
parents:
diff changeset
28 import edu.stanford.smi.protege.exception.OntologyLoadException;
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
29 import edu.stanford.smi.protege.model.Facet;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
30 import edu.stanford.smi.protege.model.Instance;
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
31 import edu.stanford.smi.protege.model.Slot;
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
32 import edu.stanford.smi.protegex.owl.jena.JenaOWLModel;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
33 import edu.stanford.smi.protegex.owl.model.OWLAllValuesFrom;
fb3f3df002df first release
dwinter
parents:
diff changeset
34 import edu.stanford.smi.protegex.owl.model.OWLClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
35 import edu.stanford.smi.protegex.owl.model.OWLDataRange;
fb3f3df002df first release
dwinter
parents:
diff changeset
36 import edu.stanford.smi.protegex.owl.model.OWLIndividual;
fb3f3df002df first release
dwinter
parents:
diff changeset
37 import edu.stanford.smi.protegex.owl.model.OWLNamedClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
38 import edu.stanford.smi.protegex.owl.model.OWLProperty;
fb3f3df002df first release
dwinter
parents:
diff changeset
39 import edu.stanford.smi.protegex.owl.model.OWLUnionClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
40 import edu.stanford.smi.protegex.owl.model.RDFList;
fb3f3df002df first release
dwinter
parents:
diff changeset
41 import edu.stanford.smi.protegex.owl.model.RDFProperty;
fb3f3df002df first release
dwinter
parents:
diff changeset
42 import edu.stanford.smi.protegex.owl.model.RDFResource;
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
43 import edu.stanford.smi.protegex.owl.model.RDFSClass;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
44 import edu.stanford.smi.protegex.owl.model.impl.AbstractOWLQuantifierRestriction;
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
45 import edu.stanford.smi.protegex.owl.model.impl.AbstractOWLRestriction;
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
46 import edu.stanford.smi.protegex.owl.model.impl.DefaultOWLAllValuesFrom;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
47 import edu.stanford.smi.protegex.owl.model.impl.DefaultOWLUnionClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
48
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
49 /**
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
50 * @author dwinter
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
51 *
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
52 *Transformiert die Lex Files in OWL
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
53 */
0
fb3f3df002df first release
dwinter
parents:
diff changeset
54 public class LexOWLTransformer {
fb3f3df002df first release
dwinter
parents:
diff changeset
55 private Logger logger = Logger.getRootLogger();
1
dwinter
parents: 0
diff changeset
56 private FileWriter missing;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
57 private OWLImporter owlDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
58 private LexDumpImporter lexDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
59 private Map<String, OWLIndividual> individualIds = new HashMap<String, OWLIndividual>(); // speichere
fb3f3df002df first release
dwinter
parents:
diff changeset
60 // ids
fb3f3df002df first release
dwinter
parents:
diff changeset
61 // fuer
fb3f3df002df first release
dwinter
parents:
diff changeset
62 // weitere
fb3f3df002df first release
dwinter
parents:
diff changeset
63 // Verwendung
fb3f3df002df first release
dwinter
parents:
diff changeset
64
1
dwinter
parents: 0
diff changeset
65 public LexOWLTransformer(OWLImporter owlDoc, LexDumpImporter lexDoc) throws IOException {
0
fb3f3df002df first release
dwinter
parents:
diff changeset
66 this.owlDoc = owlDoc;
fb3f3df002df first release
dwinter
parents:
diff changeset
67 this.lexDoc = lexDoc;
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
68 missing = new FileWriter(new File("/tmp/missing.out"));
0
fb3f3df002df first release
dwinter
parents:
diff changeset
69 }
fb3f3df002df first release
dwinter
parents:
diff changeset
70
fb3f3df002df first release
dwinter
parents:
diff changeset
71 /**
fb3f3df002df first release
dwinter
parents:
diff changeset
72 * @param args
fb3f3df002df first release
dwinter
parents:
diff changeset
73 * @throws Exception
fb3f3df002df first release
dwinter
parents:
diff changeset
74 */
fb3f3df002df first release
dwinter
parents:
diff changeset
75 public static void main(String[] args) throws Exception {
6
30fc93374f10 minor changes
dwinter
parents: 5
diff changeset
76 System.out.println("Stack size has to be large, use at least -Xmx3048M -Xss10M");
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
77 if (args.length<2){
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
78 System.out.println("Usage: \"/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput\""+
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
79 "\"/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/duomoData/LEXXDUMP.xml\"");
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
80 System.exit(-1);
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
81 }
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
82
0
fb3f3df002df first release
dwinter
parents:
diff changeset
83 Logger.getRootLogger().setLevel(Level.DEBUG);
fb3f3df002df first release
dwinter
parents:
diff changeset
84 // Import OWL
fb3f3df002df first release
dwinter
parents:
diff changeset
85 //String base = "/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput";
fb3f3df002df first release
dwinter
parents:
diff changeset
86 String base=args[0];
fb3f3df002df first release
dwinter
parents:
diff changeset
87 String baseUri= base.replace(" ", "%20");
fb3f3df002df first release
dwinter
parents:
diff changeset
88 URI ontologieUri = new URI("file://"+baseUri+"/duomoAnalysis.owl");
fb3f3df002df first release
dwinter
parents:
diff changeset
89 //URI ontologieUri = new URI(
fb3f3df002df first release
dwinter
parents:
diff changeset
90 // "file:///Users/dwinter/Documents/Projekte/Diss%20-%20data-mining/eclipseWorkspace/de.mpiwg.dwinter.duomo/owlInput/duomoAnalysis.owl");
fb3f3df002df first release
dwinter
parents:
diff changeset
91 OWLImporter owlDoc = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
92 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
93
fb3f3df002df first release
dwinter
parents:
diff changeset
94 owlDoc = new OWLImporter(base, ontologieUri);
fb3f3df002df first release
dwinter
parents:
diff changeset
95 // owlDoc.printModel();
fb3f3df002df first release
dwinter
parents:
diff changeset
96 } catch (OntologyLoadException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
97 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
98 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
99 }
fb3f3df002df first release
dwinter
parents:
diff changeset
100 // read and parse lexfile
fb3f3df002df first release
dwinter
parents:
diff changeset
101 //String lexFile = "/Users/dwinter/Documents/Projekte/Diss - data-mining/eclipseWorkspace/duomoData/LEXXDUMP.xml";
fb3f3df002df first release
dwinter
parents:
diff changeset
102 String lexFile=args[1];
fb3f3df002df first release
dwinter
parents:
diff changeset
103 LexDumpImporter lexDoc = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
104 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
105 lexDoc = new LexDumpImporter(lexFile);
fb3f3df002df first release
dwinter
parents:
diff changeset
106 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
107 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
108 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
109 } catch (IOException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
110 System.exit(-1);
fb3f3df002df first release
dwinter
parents:
diff changeset
111 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
112 }
fb3f3df002df first release
dwinter
parents:
diff changeset
113
fb3f3df002df first release
dwinter
parents:
diff changeset
114 // List<Element> cartas = lexDoc.getCartas();
fb3f3df002df first release
dwinter
parents:
diff changeset
115 // System.out.println(cartas.size());
fb3f3df002df first release
dwinter
parents:
diff changeset
116
fb3f3df002df first release
dwinter
parents:
diff changeset
117 LexOWLTransformer tf = new LexOWLTransformer(owlDoc, lexDoc);
fb3f3df002df first release
dwinter
parents:
diff changeset
118 tf.transform();
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
119 //owlDoc.save("file:///tmp/out.owl");
0
fb3f3df002df first release
dwinter
parents:
diff changeset
120 }
fb3f3df002df first release
dwinter
parents:
diff changeset
121
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
122 /**
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
123 * Hautmethoden zur Transformation
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
124 * @throws URISyntaxException
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
125 * @throws Exception
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
126 */
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
127 private void transform() throws URISyntaxException, Exception {
0
fb3f3df002df first release
dwinter
parents:
diff changeset
128 List<Element> signatures = lexDoc.getSignatures();
fb3f3df002df first release
dwinter
parents:
diff changeset
129
fb3f3df002df first release
dwinter
parents:
diff changeset
130 // Element signature = signatures.get(0);
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
131 int signatureCount = 0;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
132 int maxsign = signatures.size();
fb3f3df002df first release
dwinter
parents:
diff changeset
133 for (Element signature : signatures) {
fb3f3df002df first release
dwinter
parents:
diff changeset
134 logger.debug(String.format("Signature: %s (%s)", signatureCount,
fb3f3df002df first release
dwinter
parents:
diff changeset
135 maxsign));
4
72004a788198 save single file
dwinter
parents: 3
diff changeset
136
72004a788198 save single file
dwinter
parents: 3
diff changeset
137 signatureCount++;
72004a788198 save single file
dwinter
parents: 3
diff changeset
138 //if (signatureCount<5 || signatureCount>10)
72004a788198 save single file
dwinter
parents: 3
diff changeset
139 // continue;
0
fb3f3df002df first release
dwinter
parents:
diff changeset
140 OWLIndividual signatureInd = createSignature(signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
141
fb3f3df002df first release
dwinter
parents:
diff changeset
142 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
143 List<Element> cards = XPath.selectNodes(signature, ".//carta");
fb3f3df002df first release
dwinter
parents:
diff changeset
144 int cardsCount = 1;
fb3f3df002df first release
dwinter
parents:
diff changeset
145 int maxcards = cards.size();
fb3f3df002df first release
dwinter
parents:
diff changeset
146
fb3f3df002df first release
dwinter
parents:
diff changeset
147 // Element card=cards.get(0);
fb3f3df002df first release
dwinter
parents:
diff changeset
148 for (Element card : cards) {
fb3f3df002df first release
dwinter
parents:
diff changeset
149 logger.debug(String.format("Cards: %s (%s)", cardsCount++,
fb3f3df002df first release
dwinter
parents:
diff changeset
150 maxcards));
fb3f3df002df first release
dwinter
parents:
diff changeset
151 logger.debug(String.format("Signature: %s (%s)",
fb3f3df002df first release
dwinter
parents:
diff changeset
152 signatureCount, maxsign));
fb3f3df002df first release
dwinter
parents:
diff changeset
153 OWLIndividual cardInd = createCard(card, signatureInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
154
fb3f3df002df first release
dwinter
parents:
diff changeset
155 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
156 List<Element> records = XPath.selectNodes(card, ".//record");
fb3f3df002df first release
dwinter
parents:
diff changeset
157 for (Element record : records) {
fb3f3df002df first release
dwinter
parents:
diff changeset
158 // Element record = records.get(0);
fb3f3df002df first release
dwinter
parents:
diff changeset
159 OWLIndividual recordInd = createRecord(record, cardInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
160 OWLIndividual recordEvent = createEvent(record, recordInd); // Event
fb3f3df002df first release
dwinter
parents:
diff changeset
161 // und
fb3f3df002df first release
dwinter
parents:
diff changeset
162 // Records
fb3f3df002df first release
dwinter
parents:
diff changeset
163 // sind
fb3f3df002df first release
dwinter
parents:
diff changeset
164 // im
fb3f3df002df first release
dwinter
parents:
diff changeset
165 // Original
fb3f3df002df first release
dwinter
parents:
diff changeset
166 // im
fb3f3df002df first release
dwinter
parents:
diff changeset
167 // record-tag
fb3f3df002df first release
dwinter
parents:
diff changeset
168 }
fb3f3df002df first release
dwinter
parents:
diff changeset
169 }
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
170 //owlDoc.save("file:///tmp/out"+String.valueOf(signatureCount)+".owl");
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
171 //logger.debug("Saved:"+"/tmp/out"+String.valueOf(signatureCount)+".owl");
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
172 //owlDoc.reloadOWL();
0
fb3f3df002df first release
dwinter
parents:
diff changeset
173 }
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
174 owlDoc.printModel();
0
fb3f3df002df first release
dwinter
parents:
diff changeset
175 }
fb3f3df002df first release
dwinter
parents:
diff changeset
176
fb3f3df002df first release
dwinter
parents:
diff changeset
177 private OWLIndividual createEvent(Element record, OWLIndividual recordInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
178
fb3f3df002df first release
dwinter
parents:
diff changeset
179 logger.debug("Create Event");
fb3f3df002df first release
dwinter
parents:
diff changeset
180 OWLIndividual eventInstance = owlDoc.createInstance("RecordedEvent");
fb3f3df002df first release
dwinter
parents:
diff changeset
181
fb3f3df002df first release
dwinter
parents:
diff changeset
182 owlDoc.setProperty(recordInd, "crm:P70_documents", eventInstance);
fb3f3df002df first release
dwinter
parents:
diff changeset
183
fb3f3df002df first release
dwinter
parents:
diff changeset
184 // timespan
fb3f3df002df first release
dwinter
parents:
diff changeset
185
fb3f3df002df first release
dwinter
parents:
diff changeset
186 try {
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
187 String dateDcStart = lexDoc.getValue(record, ".//datrf/startdate");
0
fb3f3df002df first release
dwinter
parents:
diff changeset
188
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
189 String dateDcEnd = lexDoc.getValue(record, ".//datrf/enddate");
0
fb3f3df002df first release
dwinter
parents:
diff changeset
190
fb3f3df002df first release
dwinter
parents:
diff changeset
191 if (!dateDcStart.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
192 OWLIndividual timeSpan = owlDoc.createTimeSpan(dateDcStart,
fb3f3df002df first release
dwinter
parents:
diff changeset
193 dateDcEnd);
fb3f3df002df first release
dwinter
parents:
diff changeset
194 owlDoc.setProperty(eventInstance, "crm:P4_has_time-span",
fb3f3df002df first release
dwinter
parents:
diff changeset
195 timeSpan);
fb3f3df002df first release
dwinter
parents:
diff changeset
196 }
fb3f3df002df first release
dwinter
parents:
diff changeset
197 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
198 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
199 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
200 }
fb3f3df002df first release
dwinter
parents:
diff changeset
201
fb3f3df002df first release
dwinter
parents:
diff changeset
202 // tipol
fb3f3df002df first release
dwinter
parents:
diff changeset
203 String typology;
fb3f3df002df first release
dwinter
parents:
diff changeset
204 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
205 typology = lexDoc.getValue(record, ".//tipol");
fb3f3df002df first release
dwinter
parents:
diff changeset
206 OWLIndividual typolInd = createOrGetTipol(typology);
fb3f3df002df first release
dwinter
parents:
diff changeset
207 owlDoc.setProperty(eventInstance, "has_tipol", typolInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
208
fb3f3df002df first release
dwinter
parents:
diff changeset
209 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
210 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
211 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
212 }
fb3f3df002df first release
dwinter
parents:
diff changeset
213
fb3f3df002df first release
dwinter
parents:
diff changeset
214 // reges
fb3f3df002df first release
dwinter
parents:
diff changeset
215 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
216 createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
217 ".//reges/italian", "has_reges", "it");
fb3f3df002df first release
dwinter
parents:
diff changeset
218 createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
219 ".//reges/english", "has_reges", "en");
fb3f3df002df first release
dwinter
parents:
diff changeset
220 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
221 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
222 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
223 }
fb3f3df002df first release
dwinter
parents:
diff changeset
224
fb3f3df002df first release
dwinter
parents:
diff changeset
225 // nomiq
fb3f3df002df first release
dwinter
parents:
diff changeset
226
fb3f3df002df first release
dwinter
parents:
diff changeset
227 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
228 @SuppressWarnings("unchecked")
fb3f3df002df first release
dwinter
parents:
diff changeset
229 List<Element> nomiqs = XPath.selectNodes(record, ".//nomiq");
fb3f3df002df first release
dwinter
parents:
diff changeset
230 OWLIndividual recordNamesRoles = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
231 for (Element nomiq : nomiqs) {
fb3f3df002df first release
dwinter
parents:
diff changeset
232 String name = lexDoc.getValue(nomiq, "./name");
fb3f3df002df first release
dwinter
parents:
diff changeset
233 String role = lexDoc.getValue(nomiq, "./role");
fb3f3df002df first release
dwinter
parents:
diff changeset
234
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
235 String provenance = lexDoc.getValue(nomiq, "./name/provenance");
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
236
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
237
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
238
0
fb3f3df002df first release
dwinter
parents:
diff changeset
239 if (!name.equals("") && !role.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
240 recordNamesRoles = handleNameWithRole(recordInd, name, role);
fb3f3df002df first release
dwinter
parents:
diff changeset
241 } else if (!role.equals("")) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
242 recordNamesRoles = createOrGetRole(role);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
243 } else if (!name.equals("")) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
244 recordNamesRoles = createOrGetName(name);
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
245 if (provenance!=""){
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
246 owlDoc.setDataTypePropery(recordNamesRoles, "has_provenance_as_string", provenance, "it");
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
247 }
0
fb3f3df002df first release
dwinter
parents:
diff changeset
248 }
fb3f3df002df first release
dwinter
parents:
diff changeset
249
fb3f3df002df first release
dwinter
parents:
diff changeset
250 if (recordNamesRoles != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
251 owlDoc.setProperty(eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
252 "recordsDuomoObjectNameRoles", recordNamesRoles);
fb3f3df002df first release
dwinter
parents:
diff changeset
253 String id = lexDoc.getValue(nomiq, "./@id");
fb3f3df002df first release
dwinter
parents:
diff changeset
254 individualIds.put(id, recordNamesRoles);
fb3f3df002df first release
dwinter
parents:
diff changeset
255 }
fb3f3df002df first release
dwinter
parents:
diff changeset
256 }
fb3f3df002df first release
dwinter
parents:
diff changeset
257
fb3f3df002df first release
dwinter
parents:
diff changeset
258 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
259 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
260 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
261 }
fb3f3df002df first release
dwinter
parents:
diff changeset
262
fb3f3df002df first release
dwinter
parents:
diff changeset
263 // istit
fb3f3df002df first release
dwinter
parents:
diff changeset
264 try {
7
19e40abb3e8a bug in istit
dwinter
parents: 6
diff changeset
265 String istit = lexDoc.getValue(record, ".//istit");
19e40abb3e8a bug in istit
dwinter
parents: 6
diff changeset
266 if (!istit.equals("")){
0
fb3f3df002df first release
dwinter
parents:
diff changeset
267 OWLIndividual istitInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
268 "IndicesInstitutions", istit);
fb3f3df002df first release
dwinter
parents:
diff changeset
269 if (istitInd == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
270 istitInd = createOrGetInstitution(istit);
fb3f3df002df first release
dwinter
parents:
diff changeset
271 }
7
19e40abb3e8a bug in istit
dwinter
parents: 6
diff changeset
272
0
fb3f3df002df first release
dwinter
parents:
diff changeset
273
fb3f3df002df first release
dwinter
parents:
diff changeset
274 owlDoc.setProperty(eventInstance, "recordsDuomoObjectInstitution",
fb3f3df002df first release
dwinter
parents:
diff changeset
275 istitInd);
7
19e40abb3e8a bug in istit
dwinter
parents: 6
diff changeset
276 }
0
fb3f3df002df first release
dwinter
parents:
diff changeset
277
fb3f3df002df first release
dwinter
parents:
diff changeset
278 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
279 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
280 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
281 }
fb3f3df002df first release
dwinter
parents:
diff changeset
282
fb3f3df002df first release
dwinter
parents:
diff changeset
283 // types
fb3f3df002df first release
dwinter
parents:
diff changeset
284
fb3f3df002df first release
dwinter
parents:
diff changeset
285 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
286 List<Element> types = XPath.selectNodes(record, ".//type");
fb3f3df002df first release
dwinter
parents:
diff changeset
287 for (Element type : types) {
fb3f3df002df first release
dwinter
parents:
diff changeset
288 createType(eventInstance, type);
fb3f3df002df first release
dwinter
parents:
diff changeset
289 }
fb3f3df002df first release
dwinter
parents:
diff changeset
290 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
291 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
292 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
293 }
fb3f3df002df first release
dwinter
parents:
diff changeset
294
fb3f3df002df first release
dwinter
parents:
diff changeset
295 return eventInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
296 }
fb3f3df002df first release
dwinter
parents:
diff changeset
297
fb3f3df002df first release
dwinter
parents:
diff changeset
298 private void createType(OWLIndividual eventInstance, Element type) {
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
299
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
300
0
fb3f3df002df first release
dwinter
parents:
diff changeset
301 String typeId;
fb3f3df002df first release
dwinter
parents:
diff changeset
302 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
303 typeId = lexDoc.getValue(type, "./ptr/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
304 String clsName = owlDoc.getClassNameFromTypeId(typeId);
fb3f3df002df first release
dwinter
parents:
diff changeset
305 OWLIndividual typeInd = owlDoc.createInstance(clsName);
fb3f3df002df first release
dwinter
parents:
diff changeset
306
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
307 owlDoc.setProperty(eventInstance, "has_topic", typeInd);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
308 List<Element> freeTexts = XPath.selectNodes(type, "./freetext");
fb3f3df002df first release
dwinter
parents:
diff changeset
309 for (Element freeText : freeTexts) {
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
310 OWLNamedClass cls = owlDoc.getClassFromTypeId(typeId);
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
311
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
312 OWLNamedClass subjectClass = getPreferredTargetClass(cls,
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
313 "has_subject");
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
314 OWLNamedClass predicateClass = getPreferredTargetClass(cls,
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
315 "has_predicate");
0
fb3f3df002df first release
dwinter
parents:
diff changeset
316
fb3f3df002df first release
dwinter
parents:
diff changeset
317 String subjPointer = lexDoc.getValue(freeText,
fb3f3df002df first release
dwinter
parents:
diff changeset
318 "./sub/ptrtoperson/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
319 String subjText = lexDoc.getValue(freeText, "./sub");
fb3f3df002df first release
dwinter
parents:
diff changeset
320
fb3f3df002df first release
dwinter
parents:
diff changeset
321 OWLIndividual subjInd = createSubjectOrPredicate(subjectClass,
fb3f3df002df first release
dwinter
parents:
diff changeset
322 subjPointer, subjText);
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
323
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
324
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
325 //suche ob eine subpropery von materiaInvolved fuer die die zem Type (type) gehoerige Klasse (clsName) existiert
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
326 // und wenn ja welche, TODO: zur Zeit wird dann aus dem String "subjText" das entsprechende Material erzeugt.
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
327
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
328
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
329 //Collection<RDFProperty> props = cls.getPossibleRDFProperties();
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
330
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
331
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
332
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
333 RDFProperty superproperty= owlDoc.owlModel.getRDFProperty("http://ontologies.mpiwg-berlin.mpg.de/research/duomoAnalysis.owl/materialInvolved");
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
334
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
335 Collection<RDFSClass> sc = cls.getSuperclasses(true);
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
336
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
337 OWLNamedClass mat = owlDoc.owlModel.getOWLNamedClass("http://ontologies.mpiwg-berlin.mpg.de/research/duomoAnalysis.owl/DuomoActivities");
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
338
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
339 if (sc.contains(mat)){ // cls is subclass of DuomoActivities
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
340 Collection<RDFProperty> props = superproperty.getSubproperties(false);
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
341
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
342 //jetzt suche zu welcher subproperty die classe cls gehšrt
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
343
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
344 //dazu gehe durch alle subproperties von materialInvolved-
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
345 for (RDFProperty prop:props){
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
346
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
347 @SuppressWarnings("unchecked")
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
348 Collection<RDFSClass> domains = prop.getDomains(true);
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
349
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
350 for(RDFSClass domain: domains){
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
351 //if (domain.getName().equals(cls.getName()))
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
352
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
353 //suche jetzt die domaene zu diesen property in schaue ob die cls eine subklasse davon ist
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
354 if (cls.isSubclassOf(domain)) // cls ist in der domaene der property
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
355 {
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
356
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
357 //die propery muss genau einen wert aus einer festen klasse haben, diese wird jetzt gesucht und dann eine individual erzeugt.
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
358 Collection<AbstractOWLRestriction> restrictions = cls.getRestrictions(prop, false); // suche die restriction und erzeuge dann ein object dieses type
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
359 for (AbstractOWLRestriction restriction: restrictions){
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
360 if (DefaultOWLAllValuesFrom.class.isInstance(restriction)){
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
361 DefaultOWLAllValuesFrom rest = (DefaultOWLAllValuesFrom)restriction;
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
362 RDFResource restClass = rest.getAllValuesFrom();
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
363 OWLIndividual inst = owlDoc.createOrGetInstanceWithIdentifier(restClass.getLocalName(), "Identifier", subjText, false);
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
364 owlDoc.setProperty(typeInd, prop.getLocalName(), inst);
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
365 //materialInd = owlDoc.createInstance(res.getName());
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
366 }
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
367 }
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
368 }
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
369 }
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
370 }
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
371 }
0
fb3f3df002df first release
dwinter
parents:
diff changeset
372
fb3f3df002df first release
dwinter
parents:
diff changeset
373 String predPointer = lexDoc.getValue(freeText,
fb3f3df002df first release
dwinter
parents:
diff changeset
374 "./pred/ptrtoperson/@target");
fb3f3df002df first release
dwinter
parents:
diff changeset
375 String predText = lexDoc.getValue(freeText, "./pred");
fb3f3df002df first release
dwinter
parents:
diff changeset
376
fb3f3df002df first release
dwinter
parents:
diff changeset
377 OWLIndividual predInd = createSubjectOrPredicate(
fb3f3df002df first release
dwinter
parents:
diff changeset
378 predicateClass, predPointer, predText);
fb3f3df002df first release
dwinter
parents:
diff changeset
379
fb3f3df002df first release
dwinter
parents:
diff changeset
380 if (subjInd != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
381 owlDoc.setProperty(typeInd, "has_subject", subjInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
382 }
fb3f3df002df first release
dwinter
parents:
diff changeset
383
fb3f3df002df first release
dwinter
parents:
diff changeset
384 if (predInd != null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
385 owlDoc.setProperty(typeInd, "has_predicate", predInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
386 }
fb3f3df002df first release
dwinter
parents:
diff changeset
387
fb3f3df002df first release
dwinter
parents:
diff changeset
388 owlDoc.setProperty(eventInstance, "recordsDuomoObjectConcept",
fb3f3df002df first release
dwinter
parents:
diff changeset
389 typeInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
390 }
fb3f3df002df first release
dwinter
parents:
diff changeset
391
fb3f3df002df first release
dwinter
parents:
diff changeset
392 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
393 // TODO Auto-generated catch block
fb3f3df002df first release
dwinter
parents:
diff changeset
394 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
395 }
fb3f3df002df first release
dwinter
parents:
diff changeset
396
fb3f3df002df first release
dwinter
parents:
diff changeset
397 }
fb3f3df002df first release
dwinter
parents:
diff changeset
398
fb3f3df002df first release
dwinter
parents:
diff changeset
399 private OWLIndividual createSubjectOrPredicate(OWLNamedClass toClass,
fb3f3df002df first release
dwinter
parents:
diff changeset
400 String subjPointer, String subjText) {
fb3f3df002df first release
dwinter
parents:
diff changeset
401 OWLIndividual subjInd = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
402
fb3f3df002df first release
dwinter
parents:
diff changeset
403 if (!subjPointer.equals("")) {
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
404 subjInd = owlDoc.createInstance(toClass.getName());
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
405 //subjInd = toClass.createOWLIndividual(null);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
406 OWLIndividual ind = individualIds.get(subjPointer);
fb3f3df002df first release
dwinter
parents:
diff changeset
407 if (ind == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
408 logger.debug("target ID does not exist:" + subjPointer);
1
dwinter
parents: 0
diff changeset
409 try {
dwinter
parents: 0
diff changeset
410 missing.write("target ID does not exist:" + subjPointer+"\n");
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
411 missing.flush();
1
dwinter
parents: 0
diff changeset
412 } catch (IOException e) {
dwinter
parents: 0
diff changeset
413 // TODO Auto-generated catch block
dwinter
parents: 0
diff changeset
414 e.printStackTrace();
dwinter
parents: 0
diff changeset
415 }
0
fb3f3df002df first release
dwinter
parents:
diff changeset
416 } else {
fb3f3df002df first release
dwinter
parents:
diff changeset
417 owlDoc.setProperty(subjInd, "has_NameOrRoleFromIndex", ind);
fb3f3df002df first release
dwinter
parents:
diff changeset
418 }
fb3f3df002df first release
dwinter
parents:
diff changeset
419 }
fb3f3df002df first release
dwinter
parents:
diff changeset
420
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
421 if (!subjText.equals("") & !subjText.equals(" ")) {
0
fb3f3df002df first release
dwinter
parents:
diff changeset
422 if (subjInd == null)
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
423 subjInd = owlDoc.createInstance(toClass.getName());
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
424 //subjInd = toClass.createOWLIndividual(null);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
425
fb3f3df002df first release
dwinter
parents:
diff changeset
426 OWLNamedClass idcls = owlDoc.owlModel
fb3f3df002df first release
dwinter
parents:
diff changeset
427 .getOWLNamedClass("Identifier"); // is die klasse selbst
fb3f3df002df first release
dwinter
parents:
diff changeset
428 // schon ein identifiert
fb3f3df002df first release
dwinter
parents:
diff changeset
429 if (toClass.getNamedSuperclasses(true).contains(idcls)) { // to
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
430 owlDoc.setProperty(subjInd, "rdfs:label", subjText);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
431 } else {
fb3f3df002df first release
dwinter
parents:
diff changeset
432
fb3f3df002df first release
dwinter
parents:
diff changeset
433 OWLIndividual ident = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
434 .createInstance("IdentifierPredicateOrSubject");
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
435 owlDoc.setProperty(ident, "rdfs:label", subjText);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
436 owlDoc.setProperty(subjInd, "crm:P48_has_preferred_identifier",
fb3f3df002df first release
dwinter
parents:
diff changeset
437 ident);
fb3f3df002df first release
dwinter
parents:
diff changeset
438 }
fb3f3df002df first release
dwinter
parents:
diff changeset
439 }
fb3f3df002df first release
dwinter
parents:
diff changeset
440 return subjInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
441 }
fb3f3df002df first release
dwinter
parents:
diff changeset
442
fb3f3df002df first release
dwinter
parents:
diff changeset
443 private OWLNamedClass getPreferredTargetClass(OWLNamedClass cls,
fb3f3df002df first release
dwinter
parents:
diff changeset
444 String propertyName) {
fb3f3df002df first release
dwinter
parents:
diff changeset
445 RDFProperty prop = owlDoc.owlModel.getRDFProperty(propertyName);
fb3f3df002df first release
dwinter
parents:
diff changeset
446
fb3f3df002df first release
dwinter
parents:
diff changeset
447 // finde welche klasse als subject erlaubt ist
fb3f3df002df first release
dwinter
parents:
diff changeset
448 Collection<?> restrictions = cls.getRestrictions(prop, true);
fb3f3df002df first release
dwinter
parents:
diff changeset
449
fb3f3df002df first release
dwinter
parents:
diff changeset
450 RDFResource restrictionValues = prop.getRange(); // nimm erstmal den
fb3f3df002df first release
dwinter
parents:
diff changeset
451 // gesammten Range
fb3f3df002df first release
dwinter
parents:
diff changeset
452
fb3f3df002df first release
dwinter
parents:
diff changeset
453 // schaue jetzt nach ob eb es einschraenkungen gibt.
fb3f3df002df first release
dwinter
parents:
diff changeset
454 for (Iterator<?> it = restrictions.iterator(); it.hasNext();) {
fb3f3df002df first release
dwinter
parents:
diff changeset
455 Object restriction = it.next();
fb3f3df002df first release
dwinter
parents:
diff changeset
456 if (OWLAllValuesFrom.class.isInstance(restriction)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
457 OWLAllValuesFrom ar = (OWLAllValuesFrom) restriction;
fb3f3df002df first release
dwinter
parents:
diff changeset
458 restrictionValues = ar.getAllValuesFrom();
fb3f3df002df first release
dwinter
parents:
diff changeset
459 break;
fb3f3df002df first release
dwinter
parents:
diff changeset
460 }
fb3f3df002df first release
dwinter
parents:
diff changeset
461
fb3f3df002df first release
dwinter
parents:
diff changeset
462 }
fb3f3df002df first release
dwinter
parents:
diff changeset
463 OWLNamedClass toClass = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
464 if (OWLNamedClass.class.isInstance(restrictionValues)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
465 toClass = (OWLNamedClass) restrictionValues;
fb3f3df002df first release
dwinter
parents:
diff changeset
466 } else if (OWLDataRange.class.isInstance(restrictionValues)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
467 RDFList dr = ((OWLDataRange) restrictionValues).getOneOf();
fb3f3df002df first release
dwinter
parents:
diff changeset
468 for (Object d : dr.getValues()) {
fb3f3df002df first release
dwinter
parents:
diff changeset
469 System.out.println(d);
fb3f3df002df first release
dwinter
parents:
diff changeset
470 toClass = (OWLNamedClass) d;
fb3f3df002df first release
dwinter
parents:
diff changeset
471 // FIXME: geht das??
fb3f3df002df first release
dwinter
parents:
diff changeset
472 }
fb3f3df002df first release
dwinter
parents:
diff changeset
473 } else if (DefaultOWLUnionClass.class.isInstance(restrictionValues)) { // mehr
fb3f3df002df first release
dwinter
parents:
diff changeset
474 // als
fb3f3df002df first release
dwinter
parents:
diff changeset
475 // eine
fb3f3df002df first release
dwinter
parents:
diff changeset
476 // moeglich
fb3f3df002df first release
dwinter
parents:
diff changeset
477 DefaultOWLUnionClass ou = (DefaultOWLUnionClass) restrictionValues;
fb3f3df002df first release
dwinter
parents:
diff changeset
478 Set set = new HashSet();
fb3f3df002df first release
dwinter
parents:
diff changeset
479 ou.getNestedNamedClasses(set);
fb3f3df002df first release
dwinter
parents:
diff changeset
480
fb3f3df002df first release
dwinter
parents:
diff changeset
481 for (Iterator<?> it = set.iterator(); it.hasNext();) {
fb3f3df002df first release
dwinter
parents:
diff changeset
482 OWLNamedClass cl = (OWLNamedClass) it.next();
fb3f3df002df first release
dwinter
parents:
diff changeset
483 OWLNamedClass idcls = owlDoc.owlModel
fb3f3df002df first release
dwinter
parents:
diff changeset
484 .getOWLNamedClass("Identifier"); // nimm die Klasse die
fb3f3df002df first release
dwinter
parents:
diff changeset
485 // ein Identifier
fb3f3df002df first release
dwinter
parents:
diff changeset
486 // ist.
fb3f3df002df first release
dwinter
parents:
diff changeset
487 if (cl.getNamedSuperclasses(true).contains(idcls)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
488 toClass = cl;
fb3f3df002df first release
dwinter
parents:
diff changeset
489 break;
fb3f3df002df first release
dwinter
parents:
diff changeset
490 }
fb3f3df002df first release
dwinter
parents:
diff changeset
491
fb3f3df002df first release
dwinter
parents:
diff changeset
492 }
fb3f3df002df first release
dwinter
parents:
diff changeset
493 }
fb3f3df002df first release
dwinter
parents:
diff changeset
494 return toClass;
fb3f3df002df first release
dwinter
parents:
diff changeset
495 }
fb3f3df002df first release
dwinter
parents:
diff changeset
496
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
497
0
fb3f3df002df first release
dwinter
parents:
diff changeset
498
fb3f3df002df first release
dwinter
parents:
diff changeset
499 private OWLIndividual handleNameWithRole(OWLIndividual recordInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
500 String name, String role) {
fb3f3df002df first release
dwinter
parents:
diff changeset
501 // teste ob schon ein solcer Eintrag existiert
fb3f3df002df first release
dwinter
parents:
diff changeset
502 OWLIndividual nameInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
503 "IndicesNames", name);
fb3f3df002df first release
dwinter
parents:
diff changeset
504 Boolean createNewNameWithRole = false;
fb3f3df002df first release
dwinter
parents:
diff changeset
505 if (nameInd == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
506 nameInd = createOrGetName(name);
fb3f3df002df first release
dwinter
parents:
diff changeset
507 createNewNameWithRole = true; // name existierte nicht dann kann
fb3f3df002df first release
dwinter
parents:
diff changeset
508 // auch NameWithRole nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
509 // existierten.
fb3f3df002df first release
dwinter
parents:
diff changeset
510 }
fb3f3df002df first release
dwinter
parents:
diff changeset
511 OWLIndividual roleInd = owlDoc.getIndividualByReadableId(
fb3f3df002df first release
dwinter
parents:
diff changeset
512 "IndicesRoles", role);
fb3f3df002df first release
dwinter
parents:
diff changeset
513 if (roleInd == null) {
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
514 roleInd = createOrGetRole(role);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
515 createNewNameWithRole = true; // role existierte nicht dann kann
fb3f3df002df first release
dwinter
parents:
diff changeset
516 // auch NameWithRole nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
517 // existierten.
fb3f3df002df first release
dwinter
parents:
diff changeset
518 }
fb3f3df002df first release
dwinter
parents:
diff changeset
519 OWLIndividual nameWithRoleInd = null;
fb3f3df002df first release
dwinter
parents:
diff changeset
520 if (!createNewNameWithRole) { // schon klar, dass er nicht existiert
fb3f3df002df first release
dwinter
parents:
diff changeset
521 nameWithRoleInd = getNameWithRole(nameInd, roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
522 }
fb3f3df002df first release
dwinter
parents:
diff changeset
523
fb3f3df002df first release
dwinter
parents:
diff changeset
524 if (nameWithRoleInd == null) { // existiert nicht
fb3f3df002df first release
dwinter
parents:
diff changeset
525 nameWithRoleInd = createNameWithRole(nameInd, roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
526 }
fb3f3df002df first release
dwinter
parents:
diff changeset
527
fb3f3df002df first release
dwinter
parents:
diff changeset
528 return nameWithRoleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
529 }
fb3f3df002df first release
dwinter
parents:
diff changeset
530
fb3f3df002df first release
dwinter
parents:
diff changeset
531 private OWLIndividual getNameWithRole(OWLIndividual nameInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
532 OWLIndividual roleInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
533 List<OWLIndividual> indicesWithNames = owlDoc.getIndividuals(
fb3f3df002df first release
dwinter
parents:
diff changeset
534 "IndicesNameWithRole", "refers_to_name", nameInd); // suche alle
fb3f3df002df first release
dwinter
parents:
diff changeset
535 // infrage
fb3f3df002df first release
dwinter
parents:
diff changeset
536 // kommenden
fb3f3df002df first release
dwinter
parents:
diff changeset
537 // nameen
fb3f3df002df first release
dwinter
parents:
diff changeset
538
fb3f3df002df first release
dwinter
parents:
diff changeset
539 if (indicesWithNames == null) { // kein Treffer
fb3f3df002df first release
dwinter
parents:
diff changeset
540 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
541 }
fb3f3df002df first release
dwinter
parents:
diff changeset
542
fb3f3df002df first release
dwinter
parents:
diff changeset
543 for (OWLIndividual name : indicesWithNames) {
fb3f3df002df first release
dwinter
parents:
diff changeset
544 Object role = owlDoc.getRelatedIndividual(name, "refers_to_role");
fb3f3df002df first release
dwinter
parents:
diff changeset
545 if (roleInd.equals(role)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
546 return name;
fb3f3df002df first release
dwinter
parents:
diff changeset
547 }
fb3f3df002df first release
dwinter
parents:
diff changeset
548 }
fb3f3df002df first release
dwinter
parents:
diff changeset
549 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
550 }
fb3f3df002df first release
dwinter
parents:
diff changeset
551
fb3f3df002df first release
dwinter
parents:
diff changeset
552 private OWLIndividual createOrGetTipol(String typology) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
553 OWLIndividual tipol = owlDoc.createOrGetInstanceWithIdentifier("Typology","Identifier",typology,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
554 return tipol;
fb3f3df002df first release
dwinter
parents:
diff changeset
555 }
fb3f3df002df first release
dwinter
parents:
diff changeset
556
fb3f3df002df first release
dwinter
parents:
diff changeset
557 private OWLIndividual createNameWithRole(OWLIndividual nameInd,
fb3f3df002df first release
dwinter
parents:
diff changeset
558 OWLIndividual roleInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
559
fb3f3df002df first release
dwinter
parents:
diff changeset
560 OWLIndividual nameWithRoleInd = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
561 .createInstance("IndicesNameWithRole");
fb3f3df002df first release
dwinter
parents:
diff changeset
562
fb3f3df002df first release
dwinter
parents:
diff changeset
563 owlDoc.setProperty(nameWithRoleInd, "refers_to_name", nameInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
564 owlDoc.setProperty(nameWithRoleInd, "refers_to_role", roleInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
565
fb3f3df002df first release
dwinter
parents:
diff changeset
566 return nameWithRoleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
567
fb3f3df002df first release
dwinter
parents:
diff changeset
568 }
fb3f3df002df first release
dwinter
parents:
diff changeset
569
fb3f3df002df first release
dwinter
parents:
diff changeset
570 private OWLIndividual createOrGetInstitution(String name) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
571 OWLIndividual nameInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesInstitutions","IdentifierInstitutions",name,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
572
fb3f3df002df first release
dwinter
parents:
diff changeset
573 return nameInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
574 }
fb3f3df002df first release
dwinter
parents:
diff changeset
575
fb3f3df002df first release
dwinter
parents:
diff changeset
576 private OWLIndividual createOrGetName(String name) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
577 OWLIndividual nameInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesNames","IdentifierNames",name,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
578 return nameInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
579 }
fb3f3df002df first release
dwinter
parents:
diff changeset
580
2
273164f81926 bug in transformer handleroles
dwinter
parents: 1
diff changeset
581 private OWLIndividual createOrGetRole(String name) {
5
923e73fa07f1 Minor changes, Suche nach Objekten nach readableId jetzt einschraenkbar, nicht auf subclassen ausweiten.
dwinter
parents: 4
diff changeset
582 OWLIndividual roleInd = owlDoc.createOrGetInstanceWithIdentifier("IndicesRoles","IdentifierRoles",name,false);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
583 return roleInd;
fb3f3df002df first release
dwinter
parents:
diff changeset
584 }
fb3f3df002df first release
dwinter
parents:
diff changeset
585
fb3f3df002df first release
dwinter
parents:
diff changeset
586 private OWLIndividual createRecord(Element record, OWLIndividual cardInd)
fb3f3df002df first release
dwinter
parents:
diff changeset
587 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
588 OWLIndividual recordInstance = owlDoc.createInstance("Record");
fb3f3df002df first release
dwinter
parents:
diff changeset
589 owlDoc.setProperty(recordInstance, "is_on_card", cardInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
590 createNewDependingInstanceFromXpath(record, recordInstance, "./@id",
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
591 new String[] { "rdfs:label" },
0
fb3f3df002df first release
dwinter
parents:
diff changeset
592 "IdentifierCurrent", "crm:P48_has_preferred_identifier");
fb3f3df002df first release
dwinter
parents:
diff changeset
593
fb3f3df002df first release
dwinter
parents:
diff changeset
594 String value = lexDoc.getValue(record, ".//textblockid");
fb3f3df002df first release
dwinter
parents:
diff changeset
595 if (!value.equals(""))
fb3f3df002df first release
dwinter
parents:
diff changeset
596 owlDoc.setProperty(recordInstance, "has_textblockid", value);
fb3f3df002df first release
dwinter
parents:
diff changeset
597
fb3f3df002df first release
dwinter
parents:
diff changeset
598 String endOnCarta = lexDoc.getValue(record, "./@end_on_carta");
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
599
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
600 //FIXME: addRecordToCarta ist buggy. siehe dort! ausserdem wir nicht berŸcksichtig, dass zwischen
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
601 // card und end_on_carta mehr als eine liegen kann, zur Zeit wird nur die carta die in end_on_carta beschrieben wird zu
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
602 // record mittels is_on_card hinzugefŸgt.
0
fb3f3df002df first release
dwinter
parents:
diff changeset
603 if (!endOnCarta.equals("")) {
fb3f3df002df first release
dwinter
parents:
diff changeset
604 OWLIndividual signature = (OWLIndividual) owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
605 .getRelatedIndividual(cardInd, "has_signature");
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
606 addRecordToCarta(recordInstance, endOnCarta, signature);
0
fb3f3df002df first release
dwinter
parents:
diff changeset
607 }
fb3f3df002df first release
dwinter
parents:
diff changeset
608
fb3f3df002df first release
dwinter
parents:
diff changeset
609 String dateDcStart = lexDoc.getValue(record, ".//datdc/startdate");
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
610 String dateDcEnd = lexDoc.getValue(record, ".//datdc/enddate");
0
fb3f3df002df first release
dwinter
parents:
diff changeset
611
fb3f3df002df first release
dwinter
parents:
diff changeset
612 OWLIndividual timeSpan = owlDoc.createTimeSpan(dateDcStart, dateDcEnd);
fb3f3df002df first release
dwinter
parents:
diff changeset
613
fb3f3df002df first release
dwinter
parents:
diff changeset
614 owlDoc.setProperty(recordInstance, "crm:P4_has_time-span", timeSpan);
fb3f3df002df first release
dwinter
parents:
diff changeset
615
fb3f3df002df first release
dwinter
parents:
diff changeset
616 return recordInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
617 }
fb3f3df002df first release
dwinter
parents:
diff changeset
618
fb3f3df002df first release
dwinter
parents:
diff changeset
619 private void addRecordToCarta(OWLIndividual recordInstance, String cardID,
fb3f3df002df first release
dwinter
parents:
diff changeset
620 OWLIndividual signature) {
fb3f3df002df first release
dwinter
parents:
diff changeset
621
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
622 //FIXME: cartID ist nur innerhalb einer Signatur eindeutig, d.h. h, es muss die cardID gefunden werden die in der
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
623 // selben signatur lebt wir "signature"
0
fb3f3df002df first release
dwinter
parents:
diff changeset
624 OWLIndividual card = owlDoc.getIndividualByReadableId("Card", cardID);
fb3f3df002df first release
dwinter
parents:
diff changeset
625
fb3f3df002df first release
dwinter
parents:
diff changeset
626 if (card == null) {
fb3f3df002df first release
dwinter
parents:
diff changeset
627 card = createCard(cardID, signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
628 }
fb3f3df002df first release
dwinter
parents:
diff changeset
629
fb3f3df002df first release
dwinter
parents:
diff changeset
630 owlDoc.setProperty(recordInstance, "is_on_card", card);
fb3f3df002df first release
dwinter
parents:
diff changeset
631 }
fb3f3df002df first release
dwinter
parents:
diff changeset
632
fb3f3df002df first release
dwinter
parents:
diff changeset
633 private OWLIndividual createSignature(Element signature)
fb3f3df002df first release
dwinter
parents:
diff changeset
634 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
635 Element segHeaderElement = (Element) XPath.selectSingleNode(signature,
fb3f3df002df first release
dwinter
parents:
diff changeset
636 ".//segheader");
fb3f3df002df first release
dwinter
parents:
diff changeset
637 String segheader = segHeaderElement.getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
638
fb3f3df002df first release
dwinter
parents:
diff changeset
639 OWLIndividual signatureInstance = owlDoc.createInstance("Signatur");
9
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
640
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
641
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
642 OWLIndividual preferredId = owlDoc.createInstance("Identifier");
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
643 owlDoc.setProperty(preferredId, "rdfs:label", segheader);
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
644
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
645 owlDoc.setProperty(signatureInstance, "crm:P48_has_preferred_identifier",
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
646 preferredId);
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
647
4392a6adf85a new version der label mit language tag
dwinter
parents: 8
diff changeset
648
0
fb3f3df002df first release
dwinter
parents:
diff changeset
649 return signatureInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
650 }
fb3f3df002df first release
dwinter
parents:
diff changeset
651
fb3f3df002df first release
dwinter
parents:
diff changeset
652 private OWLIndividual createCard(String cardId, OWLIndividual signature) {
fb3f3df002df first release
dwinter
parents:
diff changeset
653
fb3f3df002df first release
dwinter
parents:
diff changeset
654 OWLIndividual cardInstance = owlDoc.createInstance("Card");
fb3f3df002df first release
dwinter
parents:
diff changeset
655
fb3f3df002df first release
dwinter
parents:
diff changeset
656 owlDoc.setProperty(cardInstance, "has_signature", signature);
fb3f3df002df first release
dwinter
parents:
diff changeset
657
fb3f3df002df first release
dwinter
parents:
diff changeset
658 OWLIndividual preferredId = owlDoc.createInstance("IdentifierCurrent");
fb3f3df002df first release
dwinter
parents:
diff changeset
659 owlDoc.setProperty(preferredId, "rdfs:label", cardId);
fb3f3df002df first release
dwinter
parents:
diff changeset
660
fb3f3df002df first release
dwinter
parents:
diff changeset
661 owlDoc.setProperty(cardInstance, "crm:P48_has_preferred_identifier",
fb3f3df002df first release
dwinter
parents:
diff changeset
662 preferredId);
fb3f3df002df first release
dwinter
parents:
diff changeset
663
fb3f3df002df first release
dwinter
parents:
diff changeset
664 return cardInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
665 }
fb3f3df002df first release
dwinter
parents:
diff changeset
666
fb3f3df002df first release
dwinter
parents:
diff changeset
667 private OWLIndividual createCard(Element card, OWLIndividual signatureInd) {
fb3f3df002df first release
dwinter
parents:
diff changeset
668
fb3f3df002df first release
dwinter
parents:
diff changeset
669 OWLIndividual cardInstance = owlDoc.createInstance("Card");
fb3f3df002df first release
dwinter
parents:
diff changeset
670
fb3f3df002df first release
dwinter
parents:
diff changeset
671 try {
fb3f3df002df first release
dwinter
parents:
diff changeset
672
fb3f3df002df first release
dwinter
parents:
diff changeset
673 createNewDependingInstanceFromXpath(card, cardInstance,
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
674 ".//cartanr", new String[] { "rdfs:label" }, "IdentifierCurrent",
0
fb3f3df002df first release
dwinter
parents:
diff changeset
675 "crm:P48_has_preferred_identifier");
fb3f3df002df first release
dwinter
parents:
diff changeset
676
fb3f3df002df first release
dwinter
parents:
diff changeset
677 createNewDependingInstanceFromXpath(card, cardInstance,
8
919e9f3b5efd neue klassen zur textanalyse (stanford parser eingebaut)
dwinter
parents: 7
diff changeset
678 ".//cartaant", new String[] { "rdfs:label" }, "IdentifierCurrent",
0
fb3f3df002df first release
dwinter
parents:
diff changeset
679 "crm:P1_is_identified_by");
fb3f3df002df first release
dwinter
parents:
diff changeset
680
fb3f3df002df first release
dwinter
parents:
diff changeset
681 owlDoc.setProperty(cardInstance, "has_signature", signatureInd);
fb3f3df002df first release
dwinter
parents:
diff changeset
682
fb3f3df002df first release
dwinter
parents:
diff changeset
683 } catch (JDOMException e) {
fb3f3df002df first release
dwinter
parents:
diff changeset
684 e.printStackTrace();
fb3f3df002df first release
dwinter
parents:
diff changeset
685 return null;
fb3f3df002df first release
dwinter
parents:
diff changeset
686 }
fb3f3df002df first release
dwinter
parents:
diff changeset
687
fb3f3df002df first release
dwinter
parents:
diff changeset
688 return cardInstance;
fb3f3df002df first release
dwinter
parents:
diff changeset
689 }
fb3f3df002df first release
dwinter
parents:
diff changeset
690
fb3f3df002df first release
dwinter
parents:
diff changeset
691 private void createNewDependingInstanceFromXpath(Element card,
fb3f3df002df first release
dwinter
parents:
diff changeset
692 OWLIndividual cardInstance, String xpath, String[] propertyNames,
fb3f3df002df first release
dwinter
parents:
diff changeset
693 String newInstanceClassName, String relationNameToNewInstance)
fb3f3df002df first release
dwinter
parents:
diff changeset
694 throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
695
fb3f3df002df first release
dwinter
parents:
diff changeset
696 List<?> identifierIdEls = (List<?>) XPath.selectNodes(card, xpath);
fb3f3df002df first release
dwinter
parents:
diff changeset
697 for (Object identifierIdEl : identifierIdEls) {
fb3f3df002df first release
dwinter
parents:
diff changeset
698 String identifierId = "";
fb3f3df002df first release
dwinter
parents:
diff changeset
699 if (Element.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
700 identifierId = ((Element) identifierIdEl).getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
701 } else if (Attribute.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
702 identifierId = ((Attribute) identifierIdEl).getValue();
fb3f3df002df first release
dwinter
parents:
diff changeset
703 }
fb3f3df002df first release
dwinter
parents:
diff changeset
704
fb3f3df002df first release
dwinter
parents:
diff changeset
705 OWLIndividual identifier = owlDoc
fb3f3df002df first release
dwinter
parents:
diff changeset
706 .createInstance(newInstanceClassName);
fb3f3df002df first release
dwinter
parents:
diff changeset
707 for (int i = 0; i < propertyNames.length; i++) {
fb3f3df002df first release
dwinter
parents:
diff changeset
708 owlDoc.setProperty(identifier, propertyNames[i], identifierId);
fb3f3df002df first release
dwinter
parents:
diff changeset
709 }
fb3f3df002df first release
dwinter
parents:
diff changeset
710
fb3f3df002df first release
dwinter
parents:
diff changeset
711 owlDoc.setProperty(cardInstance, relationNameToNewInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
712 identifier);
fb3f3df002df first release
dwinter
parents:
diff changeset
713 }
fb3f3df002df first release
dwinter
parents:
diff changeset
714
fb3f3df002df first release
dwinter
parents:
diff changeset
715 }
fb3f3df002df first release
dwinter
parents:
diff changeset
716
fb3f3df002df first release
dwinter
parents:
diff changeset
717 // createNewDependingDataTypePropertyFromXpath(record, eventInstance,
fb3f3df002df first release
dwinter
parents:
diff changeset
718 // ".//resges/italian", "has_reges",
fb3f3df002df first release
dwinter
parents:
diff changeset
719 // "italian");
fb3f3df002df first release
dwinter
parents:
diff changeset
720 private void createNewDependingDataTypePropertyFromXpath(Element record,
fb3f3df002df first release
dwinter
parents:
diff changeset
721 OWLIndividual eventInstance, String xpath, String propertyName,
fb3f3df002df first release
dwinter
parents:
diff changeset
722 String lang) throws JDOMException {
fb3f3df002df first release
dwinter
parents:
diff changeset
723
fb3f3df002df first release
dwinter
parents:
diff changeset
724 List<?> identifierIdEls = (List<?>) XPath.selectNodes(record, xpath);
fb3f3df002df first release
dwinter
parents:
diff changeset
725 for (Object identifierIdEl : identifierIdEls) {
fb3f3df002df first release
dwinter
parents:
diff changeset
726 String identifierId = "";
fb3f3df002df first release
dwinter
parents:
diff changeset
727 if (Element.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
728 identifierId = ((Element) identifierIdEl).getTextTrim();
fb3f3df002df first release
dwinter
parents:
diff changeset
729 } else if (Attribute.class.isInstance(identifierIdEl)) {
fb3f3df002df first release
dwinter
parents:
diff changeset
730 identifierId = ((Attribute) identifierIdEl).getValue();
fb3f3df002df first release
dwinter
parents:
diff changeset
731 }
fb3f3df002df first release
dwinter
parents:
diff changeset
732
fb3f3df002df first release
dwinter
parents:
diff changeset
733 owlDoc.setDataTypePropery(eventInstance, propertyName,
fb3f3df002df first release
dwinter
parents:
diff changeset
734 identifierId, lang);
fb3f3df002df first release
dwinter
parents:
diff changeset
735 }
fb3f3df002df first release
dwinter
parents:
diff changeset
736 }
fb3f3df002df first release
dwinter
parents:
diff changeset
737 }