annotate src/de/mpiwg/itgroup/eSciDoc/harvesting/FoxridgeHarvester.java @ 15:e0efd3a9d2f0

changes for escidoc1.4
author dwinter
date Mon, 17 Sep 2012 10:21:04 +0200
parents ad5c0748bd08
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
1 package de.mpiwg.itgroup.eSciDoc.harvesting;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
2
c6929e63b0b8 first import
dwinter
parents:
diff changeset
3 import java.io.File;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
4 import java.net.MalformedURLException;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
5 import java.net.URL;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
6
c6929e63b0b8 first import
dwinter
parents:
diff changeset
7 import org.apache.log4j.BasicConfigurator;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
8 import org.apache.log4j.Level;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
9 import org.apache.log4j.Logger;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
10 import org.apache.log4j.xml.DOMConfigurator;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
11
c6929e63b0b8 first import
dwinter
parents:
diff changeset
12 import de.mpiwg.itgroup.eSciDoc.Tools.EScidocBasicHandler;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
13 import de.mpiwg.itgroup.eSciDoc.foxridge.IndexMetaIterator;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
14 import de.mpiwg.itgroup.eSciDoc.importer.ECHOImporter;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
15 import de.mpiwg.itgroup.eSciDoc.importer.FoxridgeImporter;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
16 import de.mpiwg.itgroup.eSciDoc.transformer.ECHOTransformer;
c6929e63b0b8 first import
dwinter
parents:
diff changeset
17
3
58b52df9763c added update functionality if index.meta has changed
dwinter
parents: 2
diff changeset
18 public class FoxridgeHarvester {
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
19
c6929e63b0b8 first import
dwinter
parents:
diff changeset
20 /**
c6929e63b0b8 first import
dwinter
parents:
diff changeset
21 * @param args
c6929e63b0b8 first import
dwinter
parents:
diff changeset
22 * @throws Exception
c6929e63b0b8 first import
dwinter
parents:
diff changeset
23 */
c6929e63b0b8 first import
dwinter
parents:
diff changeset
24 public static void main(String[] args) throws Exception {
c6929e63b0b8 first import
dwinter
parents:
diff changeset
25
7
df8c62d84f8f logfile conf changed in foxridge harvester
dwinter
parents: 6
diff changeset
26 DOMConfigurator.configure("/etc/escidocImportConfig.xml");
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
27 Logger rl = Logger.getRootLogger();
c6929e63b0b8 first import
dwinter
parents:
diff changeset
28 Logger.getLogger("transformerLogger").setLevel(Level.DEBUG);
c6929e63b0b8 first import
dwinter
parents:
diff changeset
29 Logger.getLogger("addedFilesLogger").setLevel(Level.DEBUG);
c6929e63b0b8 first import
dwinter
parents:
diff changeset
30 Logger.getLogger("notAddedFilesLogger").setLevel(Level.DEBUG);
c6929e63b0b8 first import
dwinter
parents:
diff changeset
31
10
dwinter
parents: 9
diff changeset
32 rl.setLevel(Level.INFO);
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
33
8
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
34 if (args.length<4){
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
35 System.out.println("Usage: harvest username password path context.");
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
36 System.out.println("eg: harvest username password /mpiwg/online/permanent/einstein/annalen /ir/context/escidoc:12001");
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
37 System.exit(0);
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
38
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
39 }
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
40
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
41 String username = args[0];
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
42 String pw = args[1];
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
43 String path = args[2];
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
44 String context = args[3];
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
45
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
46
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
47 //IndexMetaIterator sd = new IndexMetaIterator(new File("/Volumes/online_permanent/echo"));
c6929e63b0b8 first import
dwinter
parents:
diff changeset
48 //while (sd.hasNext()){
c6929e63b0b8 first import
dwinter
parents:
diff changeset
49 // System.out.println(sd.next());
c6929e63b0b8 first import
dwinter
parents:
diff changeset
50 //}
15
e0efd3a9d2f0 changes for escidoc1.4
dwinter
parents: 10
diff changeset
51 EScidocBasicHandler connector = new EScidocBasicHandler("escidoc-mpiwg.rz-berlin.mpg.de",8080,username,pw);
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
52
8
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
53 //ESciDocDataHarvester hv = new ESciDocDataHarvester(new FoxridgeImporter(new File("/Volumes/online_permanent/")),
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
54 // new ECHOTransformer(),connector,"/ir/context/escidoc:12001");
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
55
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
56 ESciDocDataHarvester hv = new ESciDocDataHarvester(new FoxridgeImporter(new File(path)),
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
57 new ECHOTransformer(),connector,context);
a844f6948dd8 Änderungen im Walker
dwinter
parents: 7
diff changeset
58
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
59
c6929e63b0b8 first import
dwinter
parents:
diff changeset
60 //hv.readObjectsFromInstance("ECHO_collection");
10
dwinter
parents: 9
diff changeset
61 //hv.readObjectsFromInstance("ECHO_resource");
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
62
c6929e63b0b8 first import
dwinter
parents:
diff changeset
63 //hv.releaseAndSubmitObjects("/ir/context/escidoc:12001");
10
dwinter
parents: 9
diff changeset
64 //hv.releaseAndSubmitObjects(context+"/resources/members","//escidocItem:item","added esidoc test id",0);
15
e0efd3a9d2f0 changes for escidoc1.4
dwinter
parents: 10
diff changeset
65 hv.releaseAndSubmitObjects(context+"/resources/members","//escidocItem:item","first run",1);
0
c6929e63b0b8 first import
dwinter
parents:
diff changeset
66
c6929e63b0b8 first import
dwinter
parents:
diff changeset
67
c6929e63b0b8 first import
dwinter
parents:
diff changeset
68 }
c6929e63b0b8 first import
dwinter
parents:
diff changeset
69
c6929e63b0b8 first import
dwinter
parents:
diff changeset
70 }