/src/edu/ucsb/nceas/metacat/harvesterClient/HarvestDocument.java - Metacat - Ecoinformatics Redmine

metacat/src/edu/ucsb/nceas/metacat/harvesterClient/HarvestDocument.java @ 2022

       /*
        * HarvestDocument.java
        *
        * Created on January 14, 2004, 4:37 PM
        */
       package edu.ucsb.nceas.metacat.harvesterClient;
       import java.io.InputStream;
       import java.io.InputStreamReader;
       import java.io.IOException;
       import java.io.StringReader;
       import java.net.MalformedURLException;
       import java.net.URL;
       import edu.ucsb.nceas.metacat.client.*;
       import edu.ucsb.nceas.utilities.IOUtil;
       /**
        * HarvestDocument manages operations and data for a single document to be
        * harvested.
+       *
        * @author  costa
        */
       public class HarvestDocument {
         private String documentName;
         private String documentType;
         private String documentURL;
         private Harvester harvester;
         private HarvestSiteSchedule harvestSiteSchedule;
         private int identifier;
         private int revision;
         private String scope;
         /**
          * Creates a new instance of HarvestDocument. Initialized with the data
          * that was read from a single <document> element in site document list.
+         *
          * @param harvester            the parent Harvester object
          * @param harvestSiteSchedule  the parent HarvestSiteSchedule object
          * @param scope                the value of the <scope> element
          * @param identifier           the value of the <identifier> element
          * @param revision             the value of the <revision> element
          * @param documentType         the value of the <documentType> element
          * @param documentURL          the value of the <documentURL> element
          */
         public HarvestDocument(
                                 Harvester harvester,
                                 HarvestSiteSchedule harvestSiteSchedule,
                                 String scope,
                                 int identifier,
                                 int revision,
                                 String documentType,
                                 String documentURL
                               ) {
           this.harvester = harvester;
           this.harvestSiteSchedule = harvestSiteSchedule;
           this.documentType = documentType;
           this.documentURL = documentURL;
           this.scope = scope;
           this.identifier = identifier;
           this.revision = revision;
           this.documentName = scope + "." + identifier;
+        }
         /**
          * Retrieve the document from the site using its <documentURL> value.
+         *
          * @return   A StringReader containing the document string.
          */
         private StringReader getSiteDocument() {
           String documentString;
           InputStream inputStream;
           InputStreamReader inputStreamReader;
           StringReader stringReader = null;
           URL url;
           try {
             url = new URL(documentURL);
             inputStream = url.openStream();
             inputStreamReader = new InputStreamReader(inputStream);
             documentString = IOUtil.getAsString(inputStreamReader, true);
             stringReader = new StringReader(documentString);
             System.out.println("  Successfully read document: " + documentURL);
+          }
           catch (MalformedURLException e) {
             System.err.println("MalformedURLException: " + e.getMessage());
+          }
           catch (IOException e) {
             System.err.println("IOException: " + e.getMessage());
+          }
           return stringReader;
+        }
         /**
          * Harvest the document from the site. Unless Metacat already has the
          * document, retrieve the document from the site and put (insert or
          * update) it to Metacat. If Metacat already has the document, determine
          * the highest revision stored in Metacat so that this can be reported
          * back to the user.
          */
         public void harvestDocument() {
           int highestRevision;
           String metacatReturnString;
           StringReader stringReader;
           /* If metacat already has this document, determine the highest revision in
            * metacat and report it to the user; else, insert or delete the document
            * into metacat.
            */
           if (metacatHasDocument()) {
             System.out.println("  metacat has document");
             highestRevision = metacatHighestRevision();
             System.out.println("  metacatHighestRevision: " + highestRevision);
+          }
           else {
             stringReader = getSiteDocument();
             if (stringReader != null) {
               if (parseDocument()) {
                 metacatReturnString = putMetacatDocument(stringReader);
                 System.out.println("  " + metacatReturnString);
+              }
               else {
                 System.out.println("Error parsing document.");
+              }
+            }
             else {
               System.out.print("  Error reading document at URL: ");
               System.out.println(documentURL);
+            }
+          }
+        }
         /**
          * Boolean to determine whether Metacat already has this document.
+         *
          * @return  true if Metacat has the document, otherwise false
          */
         private boolean metacatHasDocument() {
           boolean     hasDocument = false;
           return hasDocument;
+        }
         /**
          * Determines the highest revision that Metacat has for this document.
+         *
          * @return  int representing the highest revision for this document in Metacat
          */
         private int metacatHighestRevision() {
           int         highestRevision = 0;
           return highestRevision;
+        }
         /**
          * Parse the document to determine whether it is valid EML prior to inserting
          * or updating it to Metacat. This is QA/QC measure. Currently unimplemented.
+         *
          * @return  true if the document is valid EML, otherwise false
          */
         private boolean parseDocument () {
           boolean success = true;
           return success;
+        }
         /**
          * Print the data fields and values in this HarvestDocument object.
          */
         void printOutput()
+        {
           System.out.println("");
           System.out.println("  scope: " + scope);
           System.out.println("  identifier: " + identifier);
           System.out.println("  revision: " + revision);
           System.out.println("  documentType: " + documentType);
           System.out.println("  documentURL: " + documentURL);
           System.out.println("  documentName: " + documentName);
+        }
         /**
          * Insert or update this document to Metacat. If revision equals 1, do an
          * insert; otherwise, do an update.
+         *
          * @return  the Metacat return string from the insert or update operation
          */
         private String putMetacatDocument(StringReader stringReader) {
           String docid = scope + "." + identifier + "." + revision;
           Metacat metacat = harvester.metacat;
           String metacatReturnString = "";
           if (harvester.connectToMetacat()) {
             try {
               if (revision == 1) {
                 System.out.println("  Inserting document to metacat: " + docid);
                 metacatReturnString = metacat.insert(docid, stringReader, null);
+              }
               else {
                 System.out.println("  Updating document to metacat: " + docid);
                 metacatReturnString = metacat.update(docid, stringReader, null);
+              }
+            }
             catch (MetacatInaccessibleException e) {
               System.err.println("MetacatInaccessibleException: " + e.getMessage());
+            }
             catch (InsufficientKarmaException e) {
               System.err.println("InsufficientKarmaException: " + e.getMessage());
+            }
             catch (MetacatException e) {
               System.err.println("MetacatException: " + e.getMessage());
+            }
             catch (IOException e) {
               System.err.println("IOException: " + e.getMessage());
+            }
+          }
           else {
             metacatReturnString = "Not putting document to metacat";
+          }
           return metacatReturnString;
+        }
+      }

(2-2/7)

Project

General

Profile

Metacat