OASIS Mailing List ArchivesView the OASIS mailing list archive below
or browse/search using MarkMail.

 


Help: OASIS Mailing Lists Help | MarkMail Help

docbook-tc message

[Date Prev] | [Thread Prev] | [Thread Next] | [Date Next] -- [Date Index] | [Thread Index] | [List Home]


Subject: Re: [docbook-tc] 5.0b1 test test release


/ Jirka Kosek <jirka@kosek.cz> was heard to say:
| The only pity is that you can't specify schema name as a parameter, so
| there must be xsi:schemaLocation inside document pointing to schema.

Oh, that's just intolerable. Here's an extension of the resolver's
xread application that accepts a list of XSD files with a -S option.
You only have to list the XSDs, it peeks inside to find the target
namespaces (because the schemas are self-identifying for crying out
loud!)

// xjparse.java - A simple command-line XML parser

/* Derived from org.apache.xml.resolver.apps.xread
 * Copyright 2001-2004 The Apache Software Foundation or its licensors,
 * as applicable.
 */

package com.nwalsh.parsers;

import java.io.FileNotFoundException;
import java.io.IOException;
import java.util.Date;
import java.util.Enumeration;
import java.util.Hashtable;
import java.util.StringTokenizer;
import java.util.Vector;

import org.xml.sax.SAXException;

//import org.xml.sax.helpers.*;

import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.parsers.DocumentBuilder;
import javax.xml.parsers.ParserConfigurationException;

import org.apache.xml.resolver.tools.ResolvingXMLReader;
import org.apache.xml.resolver.Catalog;
import org.apache.xml.resolver.CatalogManager;
import org.apache.xml.resolver.helpers.Debug;
import org.apache.xml.resolver.apps.XParseError;

import org.w3c.dom.Document;
import org.w3c.dom.Element;

/**
 * A simple command-line XML parsing application.
 *
 * <p>This class implements a simple command-line XML Parser. It's
 * just a little wrapper around the JAXP XMLReader with support for
 * catalogs.
 * </p>
 *
 * <p>Usage: xjparse [options] document.xml</p>
 *
 * <p>Where:</p>
 *
 * <dl>
 * <dt><code>-c</code> <em>catalogfile</em></dt>
 * <dd>Load a particular catalog file.</dd>
 * <dt><code>-w</code></dt>
 * <dd>Perform a well-formed parse, not a validating parse.</dd>
 * <dt><code>-v</code> (the default)</dt>
 * <dd>Perform a validating parse.</dd>
 * <dt><code>-s</code></dt>
 * <dd>Enable W3C XML Schema validation.</dd>
 * <dt><code>-n</code></dt>
 * <dd>Perform a namespace-ignorant parse.</dd>
 * <dt><code>-N</code> (the default)</dt>
 * <dd>Perform a namespace-aware parse.</dd>
 * <dt><code>-d</code> <em>integer</em></dt>
 * <dd>Set the debug level. Warnings are shown if the debug level
 * is &gt; 2.</dd>
 * <dt><code>-E</code> <em>integer</em></dt>
 * <dd>Set the maximum number of errors to display.</dd>
 * </dl>
 *
 * <p>The process ends with error-level 1, if there errors.</p>
 *
 * @see org.apache.xml.resolver.tools.ResolvingXMLReader
 *
 * @author Norman Walsh
 * <a href="mailto:Norman.Walsh@Sun.COM";>Norman.Walsh@Sun.COM</a>
 *
 * @version 1.0
 */
public class xjparse {
    private static Debug debug = CatalogManager.getStaticManager().debug;

    protected static final String SCHEMA_VALIDATION_FEATURE_ID
	= "http://apache.org/xml/features/validation/schema";;

    protected static final String SCHEMA_FULL_CHECKING_FEATURE_ID
	= "http://apache.org/xml/features/validation/schema-full-checking";;

    protected static final String EXTERNAL_SCHEMA_LOCATION_PROPERTY_ID
	= "http://apache.org/xml/properties/schema/external-schemaLocation";;

    protected static final String EXTERNAL_NONS_SCHEMA_LOCATION_PROPERTY_ID
	= "http://apache.org/xml/properties/schema/external-noNamespaceSchemaLocation";;

  /** The main entry point */
  public static void main (String[] args)
    throws FileNotFoundException, IOException {

    String  xmlfile    = null;
    int     debuglevel = 0;
    int     maxErrs    = 10;
    boolean nsAware    = true;
    boolean validating = true;
    boolean useSchema  = false;
    boolean showWarnings = (debuglevel > 2);
    boolean showErrors = true;
    boolean fullChecking = false; // true implies useSchema
    Hashtable schemaList = null; // non-null implies useSchema
    Vector catalogFiles = new Vector();

    for (int i=0; i<args.length; i++) {
      if (args[i].equals("-c")) {
	++i;
	catalogFiles.add(args[i]);
	continue;
      }

      if (args[i].equals("-w")) {
	validating = false;
	continue;
      }

      if (args[i].equals("-v")) {
	validating = true;
	continue;
      }

      if (args[i].equals("-s")) {
	useSchema = true;
	continue;
      }

      if (args[i].equals("-S")) {
	++i;
	schemaList = lookupSchemas(args[i]);
	useSchema = true;
	continue;
      }

      if (args[i].equals("-f")) {
	fullChecking = true;
	useSchema = true;
	continue;
      }

      if (args[i].equals("-n")) {
	nsAware = false;
	continue;
      }

      if (args[i].equals("-N")) {
	nsAware = true;
	continue;
      }

      if (args[i].equals("-d")) {
	++i;
	String debugstr = args[i];
	try {
	  debuglevel = Integer.parseInt(debugstr);
	  if (debuglevel >= 0) {
	    debug.setDebug(debuglevel);
	    showWarnings = (debuglevel > 2);
	  }
	} catch (Exception e) {
	  // nop
	}
	continue;
      }

      if (args[i].equals("-E")) {
	++i;
	String errstr = args[i];
	try {
	  int errs = Integer.parseInt(errstr);
	  if (errs >= 0) {
	    maxErrs = errs;
	  }
	} catch (Exception e) {
	  // nop
	}
	continue;
      }

      xmlfile = args[i];
    }

    if (xmlfile == null) {
      System.out.println("Usage: org.apache.xml.resolver.apps.xjparse [opts] xmlfile");
      System.exit(1);
    }

    ResolvingXMLReader reader = new ResolvingXMLReader();

    try {
      reader.setFeature("http://xml.org/sax/features/namespaces";, nsAware);
      reader.setFeature("http://xml.org/sax/features/validation";, validating);
      if (useSchema) {
	  reader.setFeature(SCHEMA_VALIDATION_FEATURE_ID, useSchema);
	  reader.setFeature(SCHEMA_FULL_CHECKING_FEATURE_ID, fullChecking);
	  if (schemaList != null) {
	      String slh = "";
	      String nons_slh = "";
	      Enumeration nskey = schemaList.keys();
	      while (nskey.hasMoreElements()) {
		  String ns = (String) nskey.nextElement();
		  String xsd = (String) schemaList.get(ns);
		  if ("".equals(ns)) {
		      nons_slh = xsd;
		  } else {
		      if (!"".equals(slh)) {
			  slh = slh + " ";
		      }
		      slh = slh + ns + " " + xsd;
		  }
	      }

	      if (!"".equals(slh)) {
		  reader.setProperty(EXTERNAL_SCHEMA_LOCATION_PROPERTY_ID,
				     slh);
	      }

	      if (!"".equals(nons_slh)) {
		  reader.setProperty(EXTERNAL_NONS_SCHEMA_LOCATION_PROPERTY_ID,
				     nons_slh);
	      }
	  }
      }
    } catch (SAXException e) {
      // nop;
    }

    Catalog catalog = reader.getCatalog();

    for (int count = 0; count < catalogFiles.size(); count++) {
      String file = (String) catalogFiles.elementAt(count);
      catalog.parseCatalog(file);
    }

    XParseError xpe = new XParseError(showErrors, showWarnings);
    xpe.setMaxMessages(maxErrs);
    reader.setErrorHandler(xpe);

    String parseType = validating ? "validating" : "well-formed";
    String nsType = nsAware ? "namespace-aware" : "namespace-ignorant";
    if (maxErrs > 0) {
      System.out.println("Attempting "
			 + parseType
			 + ", "
			 + nsType
			 + " parse");
    }

    Date startTime = new Date();

    try {
      reader.parse(xmlfile);
    } catch (SAXException sx) {
      System.out.println("SAX Exception: " + sx);
    } catch (Exception e) {
      e.printStackTrace();
    }

    Date endTime = new Date();

    long millisec = endTime.getTime() - startTime.getTime();
    long secs = 0;
    long mins = 0;
    long hours = 0;

    if (millisec > 1000) {
      secs = millisec / 1000;
      millisec = millisec % 1000;
    }

    if (secs > 60) {
      mins = secs / 60;
      secs = secs % 60;
    }

    if (mins > 60) {
      hours = mins / 60;
      mins = mins % 60;
    }

    if (maxErrs > 0) {
      System.out.print("Parse ");
      if (xpe.getFatalCount() > 0) {
	System.out.print("failed ");
      } else {
	System.out.print("succeeded ");
	System.out.print("(");
	if (hours > 0) {
	  System.out.print(hours + ":");
	}
	if (hours > 0 || mins > 0) {
	  System.out.print(mins + ":");
	}
	System.out.print(secs + "." + millisec);
	System.out.print(") ");
      }
      System.out.print("with ");

      int errCount = xpe.getErrorCount();
      int warnCount = xpe.getWarningCount();

      if (errCount > 0) {
	System.out.print(errCount + " error");
	System.out.print(errCount > 1 ? "s" : "");
	System.out.print(" and ");
      } else {
	System.out.print("no errors and ");
      }

      if (warnCount > 0) {
	System.out.print(warnCount + " warning");
	System.out.print(warnCount > 1 ? "s" : "");
	System.out.print(".");
      } else {
	System.out.print("no warnings.");
      }

      System.out.println("");
    }

    if (xpe.getErrorCount() > 0) {
      System.exit(1);
    }
  }

    private static Hashtable lookupSchemas(String schemaLocs) {
	Hashtable mapping = new Hashtable();

	try {
	    DocumentBuilderFactory dbf = DocumentBuilderFactory.newInstance();
	    dbf.setIgnoringComments(true);
	    dbf.setNamespaceAware(true);
	    dbf.setValidating(false);
	    DocumentBuilder db = dbf.newDocumentBuilder();

	    StringTokenizer tokenizer = new StringTokenizer(schemaLocs);
	    while (tokenizer.hasMoreTokens()) {
		String xsd = tokenizer.nextToken();
		Document doc = db.parse(xsd);
		Element s = doc.getDocumentElement();
		String targetNS = s.getAttribute("targetNamespace");
		if (targetNS == null || "".equals(targetNS)) {
		    mapping.put("", xsd);
		} else {
		    mapping.put(targetNS, xsd);
		}
	    }
	} catch (ParserConfigurationException pce) {
	    pce.printStackTrace();
	} catch (SAXException se) {
	    se.printStackTrace();
	} catch (IOException ioe) {
	    ioe.printStackTrace();
	}

	return mapping;
    }
}



                                        Be seeing you,
                                          norm

-- 
Norman Walsh <ndw@nwalsh.com>      | The happiest people seem to be
http://www.oasis-open.org/docbook/ | those that have no particular
Chair, DocBook Technical Committee | reason for being happy except that
                                   | they are so.--W. R. Inge

PGP signature



[Date Prev] | [Thread Prev] | [Thread Next] | [Date Next] -- [Date Index] | [Thread Index] | [List Home]