+ /**
+  * Looks up every document id of {@code documents} at the service and records the treatments
+  * found for it in {@code docs}.
+  *
+  * <p>For each key of {@code documents} the URL {@code plaziUrlDoc + docId} is read line by line.
+  * Each line starting with {@code "<treatment "} is parsed for its {@code taxon}, {@code docId},
+  * {@code link}, {@code startPage} and {@code endPage} attributes, and the entry
+  * {@code startPage---endPage---taxon---link} is appended to the list of that docId, which is
+  * then stored in {@code docs}.
+  *
+  * <p>A treatment line that lacks one of these attributes makes the corresponding
+  * {@code split(...)[1]} access fail with an {@link ArrayIndexOutOfBoundsException}.
+  *
+  * @param documents map whose keys are the document ids to query; an existing value list is
+  *     reused and appended to when a treatment with the same docId is found
+  * @param docs map that receives the treatment list per docId
+  * @throws MalformedURLException if a lookup URL is not a valid URL
+  * @throws IOException if opening or reading the response fails
+  */
+ private static void checkTreatmentAvailable(Map<String, List<String>> documents, Map<String, List<String>> docs)
+         throws IOException, MalformedURLException {
+     for (String docId : documents.keySet()) {
+         URL url = new URL(plaziUrlDoc + docId);
+         BufferedReader in = new BufferedReader(new InputStreamReader(url.openStream()));
+         try {
+             String inputLine;
+             while ((inputLine = in.readLine()) != null) {
+                 if (!inputLine.startsWith("<treatment ")) {
+                     continue;
+                 }
+                 String taxon = inputLine.split("taxon=\"")[1].split("\"")[0];
+                 String docID = inputLine.split("docId=\"")[1].split("\"")[0];
+                 String link = inputLine.split("link=\"")[1].split("\"")[0];
+                 String pageStart = inputLine.split("startPage=\"")[1].split("\"")[0];
+                 String pageEnd = inputLine.split("endPage=\"")[1].split("\"")[0];
+
+                 // NOTE(review): the list is looked up in 'documents' but stored in 'docs', so both
+                 // maps end up sharing (and growing) the same list instance. Confirm this is
+                 // intended and that 'docs.get(docID)' was not meant here.
+                 List<String> docList = documents.get(docID);
+                 if (docList == null) {
+                     docList = new ArrayList<String>();
+                 }
+                 docList.add(pageStart + "---" + pageEnd + "---" + taxon + "---" + link);
+                 docs.put(docID, docList);
+             }
+         } finally {
+             // Closing the reader also closes the underlying URL stream; without this every
+             // document id would leave a connection open.
+             in.close();
+         }
+     }
+ }
+
+ /**
+  * Queries the service once per filter and groups the treatments found by document id.
+  *
+  * <p>The URL read for a filter is {@code plaziUrlDoc + filter} for {@code FilterType.MODS} and
+  * {@code plaziUrl + filter} for {@code FilterType.TAXON}; for any other filter type the
+  * {@code urlstr} argument is used unchanged. Each response line starting with
+  * {@code "<treatment "} is parsed for its {@code taxon}, {@code docId}, {@code link},
+  * {@code startPage} and {@code endPage} attributes and stored as
+  * {@code startPage---endPage---taxon---link} under its docId.
+  *
+  * <p>Every response line and every parsed docId is also written to standard output. A treatment
+  * line that lacks one of the attributes makes the corresponding {@code split(...)[1]} access
+  * fail with an {@link ArrayIndexOutOfBoundsException}.
+  *
+  * @param filterType selects which base URL the filters are appended to
+  * @param filterList values appended to the base URL, one request per entry
+  * @param urlstr URL used as-is when {@code filterType} is neither MODS nor TAXON
+  * @return map from docId to the list of treatment entries found for it
+  * @throws MalformedURLException if a request URL is not a valid URL
+  * @throws IOException if opening or reading a response fails
+  */
+ private static Map<String, List<String>> fillDocumentMap(FilterType filterType,
+         String[] filterList, String urlstr)
+         throws MalformedURLException, IOException {
+
+     Map<String, List<String>> documents = new HashMap<String, List<String>>();
+     for (String filter : filterList) {
+         if (filterType == FilterType.MODS) {
+             urlstr = plaziUrlDoc + filter;
+         } else if (filterType == FilterType.TAXON) {
+             urlstr = plaziUrl + filter;
+         }
+         log.info("URLstr: " + urlstr);
+
+         URL plaziURL = new URL(urlstr);
+         BufferedReader in = new BufferedReader(new InputStreamReader(plaziURL.openStream()));
+
+         //TODO lastUpdate field
+         try {
+             String inputLine;
+             while ((inputLine = in.readLine()) != null) {
+                 System.out.println(inputLine);
+                 if (!inputLine.startsWith("<treatment ")) {
+                     continue;
+                 }
+                 String taxon = inputLine.split("taxon=\"")[1].split("\"")[0];
+                 String docID = inputLine.split("docId=\"")[1].split("\"")[0];
+                 System.out.println("docID: "+docID);
+
+                 String link = inputLine.split("link=\"")[1].split("\"")[0];
+                 String pageStart = inputLine.split("startPage=\"")[1].split("\"")[0];
+                 String pageEnd = inputLine.split("endPage=\"")[1].split("\"")[0];
+
+                 List<String> docList = documents.get(docID);
+                 if (docList == null) {
+                     // First treatment seen for this document: register a fresh list.
+                     docList = new ArrayList<String>();
+                     documents.put(docID, docList);
+                 }
+                 docList.add(pageStart + "---" + pageEnd + "---" + taxon + "---" + link);
+             }
+         } finally {
+             // Closing the reader also closes the underlying URL stream; without this every
+             // filter would leave a connection open.
+             in.close();
+         }
+     }
+     System.out.println("documents created");
+
+     return documents;
+ }
+