Project

General

Profile

« Previous | Next » 

Revision 471

Added by bojilova over 24 years ago

Separate thread used for writing into xml_index table.
This cut the time of the response on insert almost in half.
The tread is started afterwards
(on end of document parsing and inserting into xml_nodes) from
DBSAXHandler and uses new(separate) db connection.
But I did not find a good way to show the work done of that thread.

View differences:

src/edu/ucsb/nceas/metacat/DBSAXHandler.java
16 16

  
17 17
import java.sql.*;
18 18
import java.util.Stack;
19
import java.util.Vector;
20
import java.util.Enumeration;
19 21
import java.util.EmptyStackException;
20 22

  
21 23
import org.xml.sax.Attributes;
......
30 32
 * call when processing the XML stream and generating events
31 33
 */
32 34
public class DBSAXHandler extends DefaultHandler 
33
                          implements LexicalHandler, DeclHandler {
35
                          implements LexicalHandler, DeclHandler, Runnable {
34 36

  
35 37
   private boolean	atFirstElement;
36 38
   private boolean	processingDTD;
......
38 40
   private String 	doctype;
39 41
   private String 	systemid;
40 42
   private boolean 	stackCreated = false;
41
   private Stack 	nodeStack;
42
   private Connection	conn = null;
43
   private Stack 	  nodeStack;
44
   private Vector   nodeIndex;
45
   private Connection	  conn = null;
43 46
   private DocumentImpl currentDocument;
44 47
   private DBSAXNode    rootNode;
45
   private String       action = null;
46
   private String       docid = null;
47
   private String       user = null;
48
   private String   action = null;
49
   private String   docid = null;
50
   private String   user = null;
51
   private Thread   xmlIndex;
52
   private boolean endDocument = false;
48 53

  
49 54
   private static final int MAXDATACHARS = 4000;
50 55
   private static final int MAXTITLELEN = 1000;
......
62 67
     // if it doesn't already exist
63 68
     if (!stackCreated) {
64 69
       nodeStack = new Stack();
70
       nodeIndex = new Vector();
65 71
       stackCreated = true;
66 72
     }
67 73
   }
......
79 85
     this.action = action;
80 86
     this.docid = docid;
81 87
     this.user = user;
88
     this.xmlIndex = new Thread(this);
89
     //this.xmlIndex.setPriority(Thread.MIN_PRIORITY);
82 90
   }
83 91

  
84 92
   /** SAX Handler that receives notification of beginning of the document */
......
94 102

  
95 103
   /** SAX Handler that receives notification of end of the document */
96 104
   public void endDocument() throws SAXException {
97
// NOT NEEDED ANY MORE - use currentDocument.setTitle() from characters(cbuf,start,end)
98
//     currentDocument.setTitleFromChildElement();
99 105
     MetaCatUtil.debugMessage("end Document");
100
// NOT NEEDED ANY MORE - Accession# is generated at the very beginning before the parsing
101
//     if ((docid != null) && (!docid.equals(currentDocument.getDocID()))) {
102
//       throw (new SAXException("New document ID generated:",
103
//           new AccessionNumberGeneratedException(currentDocument.getDocID())));
104
//     } else {
105
//       throw (new SAXException("New document ID generated:",
106
//           new AccessionNumberGeneratedException(currentDocument.getDocID())));
107
//     }
106
     // Starting new thread for writing XML Index.
107
     // It calls the run method of the thread.
108
     try {
109
       xmlIndex.start();
110
     } catch (NullPointerException e) {
111
       xmlIndex = null;
112
       throw new 
113
       SAXException("Problem with starting thread for writing XML Index. " +
114
                    e.getMessage());
115
     }
108 116
   }
109 117

  
110 118
   /** SAX Handler that is called at the start of each XML element */
......
151 159
     currentNode = new DBSAXNode(conn, localName, parentNode,
152 160
                                 currentDocument.getRootNodeID(),docid,
153 161
                                 currentDocument.getDoctype());
154
                                 
162
                               
155 163
     // Add all of the attributes
156 164
     for (int i=0; i<atts.getLength(); i++) {
157 165
       currentNode.setAttribute(atts.getLocalName(i), atts.getValue(i), docid);
......
160 168
     // Add the node to the stack, so that any text data can be 
161 169
     // added as it is encountered
162 170
     nodeStack.push(currentNode);
171
     // Add the node to the vector used by thread for writing XML Index
172
     nodeIndex.addElement(currentNode);
173

  
163 174
  }
175
  
176
  // The run method of xmlIndex thread. It writes XML Index for the document.
177
  public void run () {
178
    DBSAXNode currNode = null;
179
    DBSAXNode prevNode = null;
180
    int step = 0;
181
    int counter = 0;
164 182

  
183
    try {
184
      // Opening separate db connection for writing XML Index
185
      MetaCatUtil util = new MetaCatUtil();
186
      Connection conn = util.getConnection();
187
      conn.setAutoCommit(false);
188

  
189
      // Going through the elements of the document and writing its Index
190
      Enumeration nodes = nodeIndex.elements();
191
      while ( nodes.hasMoreElements() ) {
192
        currNode = (DBSAXNode)nodes.nextElement();
193
        currNode.updateNodeIndex(conn, docid, currentDocument.getDoctype());
194
      }
195
    
196
      conn.commit();
197
      conn.close();
198
    
199
    } catch (Exception e) {
200
      try {
201
        conn.rollback();
202
        conn.close();
203
      } catch (SQLException sqle) {}
204
      System.out.println("Error writing XML Index. " + e.getMessage()); 
205
    }      
206
  }
207

  
165 208
  /** SAX Handler that is called for each XML text node */
166 209
  public void characters(char[] cbuf, int start, int len) throws SAXException {
167 210
     MetaCatUtil.debugMessage("CHARACTERS");
src/edu/ucsb/nceas/metacat/DBSAXNode.java
60 60
    this.conn = conn;
61 61
    this.parentNode = parentNode;
62 62
    writeChildNodeToDB("ELEMENT", getTagName(), null, docid);
63
    updateNodeIndex(docid, doctype);
63
    //No writing XML Index from here. New Thread used instead.
64
    //updateNodeIndex(docid, doctype);
64 65
  }
65 66
    
66 67
  /** creates SQL code and inserts new node into DB connection */
......
159 160
      }
160 161
  }
161 162

  
162
  /** 
163
   * creates SQL code to put doc ID for the document node and for 
164
   * comment/PI nodes under document node into DB connection 
165
   */
166
/*  
167
  public void writeDocID(String doc_id) {
168
      try {
169
        PreparedStatement pstmt;
170
        pstmt = conn.prepareStatement(
171
              "UPDATE xml_nodes set docid = ? " +
172
              "WHERE nodeid = ?");
173

  
174
        // Bind the values to the query
175
        pstmt.setString(1, doc_id);
176
        pstmt.setLong(2, getNodeID());
177
        // Do the insertion
178
        pstmt.execute();
179
        pstmt.close();
180

  
181
        // for comments and PI on the top
182
        pstmt = conn.prepareStatement(
183
              "UPDATE xml_nodes set docid = ? " +
184
              "WHERE parentnodeid = ?");
185
        // Bind the values to the query
186
        pstmt.setString(1, doc_id);
187
        pstmt.setLong(2, getNodeID());
188
        // Do the insertion
189
        pstmt.execute();
190
        pstmt.close();
191
      } catch (SQLException e) {
192
        System.out.println(e.getMessage());
193
      }   
194
  }
195
*/
196 163
  /** get next node id from DB connection */
197 164
  private long generateNodeID() throws SAXException {
198 165
      long nid=0;
......
230 197
  }
231 198

  
232 199
  /** 
200
   * NOT USED
233 201
   * Update the node index (xml_index) for this node by generating
234 202
   * test strings that represent all of the relative and absolute
235 203
   * paths through the XML tree from document root to this node
......
285 253
      pstmt.setLong(5, getParentID());
286 254
      
287 255
      // Step through the hashtable and insert each of the path values
256
      Enumeration en = pathlist.keys();
257
      while (en.hasMoreElements()) {
258
        String path = (String)en.nextElement();
259
        Long nodeid = (Long)pathlist.get(path);
260
        pstmt.setLong(1, nodeid.longValue());
261
        pstmt.setString(2, path);
262
        pstmt.executeUpdate();
263
  
264
        //System.out.println(nodeid + " ==> " + path);
265
      }
266

  
267
      // Close the database statement
268
      pstmt.close();
269
    } catch (SQLException sqe) {
270
      System.err.println("SQL Exception while inserting path to index.");
271
      System.err.println(sqe.getMessage());
272
      throw new SAXException(sqe.getMessage());
273
    }
274
  }
275

  
276
  /** 
277
   * USED FROM SEPARATE THREAD RUNNED from DBSAXHandler on endDocument()
278
   * Update the node index (xml_index) for this node by generating
279
   * test strings that represent all of the relative and absolute
280
   * paths through the XML tree from document root to this node
281
   */
282
  public void updateNodeIndex(Connection conn, String docid, String doctype) 
283
               throws SAXException
284
  {
285
    Hashtable pathlist = new Hashtable();
286
    boolean atStartingNode = true;
287
    boolean atRootDocumentNode = false;
288
    DBSAXNode nodePointer = this;
289
    StringBuffer currentPath = new StringBuffer();
290
    int counter = 0;
291

  
292
    // Create a Hashtable of all of the paths to reach this node
293
    // including absolute paths and relative paths
294
    while (!atRootDocumentNode) {
295
      if (atStartingNode) {
296
        currentPath.insert(0, nodePointer.getTagName());
297
        pathlist.put(currentPath.toString(), new Long(getNodeID()));
298
        counter++;
299
        atStartingNode = false;
300
      } else {
301
        currentPath.insert(0, "/");
302
        currentPath.insert(0, nodePointer.getTagName());
303
        pathlist.put(currentPath.toString(), new Long(getNodeID()));
304
        counter++;
305
      }
306

  
307
      // advance to the next parent node
308
      nodePointer = nodePointer.getParentNode();
309

  
310
      // If we're at the DOCUMENT node (root of DOM tree), add
311
      // the root "/" to make the absolute path
312
      if (nodePointer.getNodeType().equals("DOCUMENT")) {
313
        currentPath.insert(0, "/");
314
        pathlist.put(currentPath.toString(), new Long(getNodeID()));
315
        counter++;
316
        atRootDocumentNode = true;
317
      } 
318
    }
319

  
320
    try {
321
      // Create an insert statement to reuse for all of the path insertions
322
      PreparedStatement pstmt = conn.prepareStatement(
323
              "INSERT INTO xml_index (nodeid, path, docid, doctype, " + 
324
               "parentnodeid) " + 
325
              "VALUES (?, ?, ?, ?, ?)");
326
      ((OraclePreparedStatement)pstmt).setExecuteBatch(counter);
327
  
328
      pstmt.setString(3, docid);
329
      pstmt.setString(4, doctype);
330
      pstmt.setLong(5, getParentID());
331
      
332
      // Step through the hashtable and insert each of the path values
288 333
      Enumeration en = pathlist.keys();
289 334
      while (en.hasMoreElements()) {
290 335
        String path = (String)en.nextElement();

Also available in: Unified diff