diff src/de/mpiwg/itgroup/eSciDoc/harvesting/ESciDocDataHarvester.java @ 10:ad5c0748bd08

minor
author dwinter
date Mon, 20 Aug 2012 12:53:45 +0200
parents b6cf6462d709
children
line wrap: on
line diff
--- a/src/de/mpiwg/itgroup/eSciDoc/harvesting/ESciDocDataHarvester.java	Thu Jun 21 09:46:26 2012 +0200
+++ b/src/de/mpiwg/itgroup/eSciDoc/harvesting/ESciDocDataHarvester.java	Mon Aug 20 12:53:45 2012 +0200
@@ -240,9 +240,10 @@
 					// TODO write PID to back to echo-obj
 					Boolean result = connector.createItem(escidocItem);
 					if (result) {
-						addedObjects.add(escidocItem.getESciDocId());
-						addedFile.debug(escidocItem.getESciDocId() + "\n");
-
+						String objID=escidocItem.getESciDocId();
+						addedObjects.add(objID);
+						addedFile.debug(objID + "\n");
+						((ECHORessource)obj).writeEsciDocIDToIndexMeta(objID.replace("/ir/item/",""));
 					} else {
 						notAddedObjects.add(obj.echoUrl);
 						notAddedFile.debug(obj.echoUrl);
@@ -344,7 +345,7 @@
 		Integer numberOfHits = connector.getNumberOfHitsFromFilterResult(
 				command, objectXPath,mode);
 
-
+		logger.info(String.format("%s objects found.", numberOfHits));
 		int tausend = ((numberOfHits-1) / MAX_REC);
 
 		String queryRestrict="";
@@ -353,7 +354,7 @@
 		} else {
 			queryRestrict="query=%22/properties/version/status%22=submitted";
 		}
-
+		int counter=0;
 		for (int t = 0; t <= tausend; t++) {
 			int start = t * MAX_REC+1;
 			// int max=Math.min((t+1)*1000, numberOfHits);
@@ -362,6 +363,9 @@
 			for (eSciDocXmlObject obj : connector
 					.getObjectsFromFilterResult(command+query, objectXPath)) {
 
+				logger.info(String.format("%s/%s", counter,numberOfHits));
+				counter+=1;
+				
 				//TODO is the following really necessary, currently the obj in the list is sometimes not the current one.
 				try{
 					HttpResponse resObj = connector.eScidocGet(obj.getESciDocId());
@@ -436,7 +440,7 @@
 				new ECHOTransformer(), connector, "/ir/context/escidoc:1001");
 
 		// hv.readObjectsFromInstance("ECHO_collection");
-		hv.readObjectsFromInstance("ECHO_resource");
+		//hv.readObjectsFromInstance("ECHO_resource");
 
 		hv.releaseAndSubmitObjects(
 				"/ir/context/escidoc:1001/resources/members",