Package org.apache.abdera.parser.stax

Source Code of org.apache.abdera.parser.stax.FOMParser

/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements.  The ASF licenses this file to You
* under the Apache License, Version 2.0 (the "License"); you may not
* use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.  For additional information regarding
* copyright in this work, please see the NOTICE file in the top level
* directory of this distribution.
*/
package org.apache.abdera.parser.stax;

import java.io.InputStream;
import java.io.Reader;

import javax.xml.stream.XMLInputFactory;
import javax.xml.stream.XMLStreamException;
import javax.xml.stream.XMLStreamReader;

import org.apache.abdera.Abdera;
import org.apache.abdera.factory.Factory;
import org.apache.abdera.i18n.iri.IRI;
import org.apache.abdera.i18n.text.Localizer;
import org.apache.abdera.i18n.text.io.CompressionUtil;
import org.apache.abdera.model.Document;
import org.apache.abdera.model.Element;
import org.apache.abdera.parser.ParseException;
import org.apache.abdera.parser.Parser;
import org.apache.abdera.parser.ParserOptions;
import org.apache.abdera.parser.stax.util.FOMSniffingInputStream;
import org.apache.abdera.parser.stax.util.FOMXmlRestrictedCharReader;
import org.apache.abdera.util.AbstractParser;
import org.apache.axiom.om.OMDocument;
import org.apache.axiom.om.util.StAXUtils;

public class FOMParser
  extends AbstractParser
  implements Parser {

  public FOMParser() {
    super();
  }
 
  public FOMParser(Abdera abdera) {
    super(abdera);
  }
 
  private FOMFactory getFomFactory(ParserOptions options) {
    FOMFactory factory =
      (options != null && options.getFactory() != null) ?
        (FOMFactory)options.getFactory() : null;
    if (factory == null) {
      Factory f = getFactory();
      factory = (f instanceof FOMFactory) ?
        (FOMFactory)f : new FOMFactory();
    }
    return factory;
  }
 
  private <T extends Element>Document<T> getDocument(
    FOMBuilder builder,
    IRI base,
    ParserOptions options)
      throws ParseException {
    Document<T> document = builder.getFomDocument();
    try {
      if (base != null)
        document.setBaseUri(base.toString());
      if (options != null && options.getCharset() != null)
        ((OMDocument)document).setCharsetEncoding(options.getCharset());
      if (options != null) document.setMustPreserveWhitespace(options.getMustPreserveWhitespace());
    } catch (Exception e) {
      if (!(e instanceof ParseException))
        e = new ParseException(e);
      throw (ParseException)e;
    }
    return document;
  }
   
  public <T extends Element>Document<T> parse(
    InputStream in,
    String base,
    ParserOptions options)
      throws ParseException {
    if (in == null)
      throw new IllegalArgumentException(Localizer.get("INPUTSTREAM.NOT.NULL"));
    try {
      if (options == null) options = getDefaultParserOptions();
      if (options.getCompressionCodecs() != null) {
        in = CompressionUtil.getDecodingInputStream(
          in, options.getCompressionCodecs());
      }
      String charset = options.getCharset();
      if (charset == null && options.getAutodetectCharset()) {
        FOMSniffingInputStream sin =
          (in instanceof FOMSniffingInputStream) ?
            (FOMSniffingInputStream)in :
            new FOMSniffingInputStream(in);
        charset = sin.getEncoding();
        if (charset != null) options.setCharset(charset);
        in = sin;
      }
      if (options.getFilterRestrictedCharacters()) {
        Reader rdr = (charset == null) ?
          new FOMXmlRestrictedCharReader(
            in,options.getFilterRestrictedCharacterReplacement()) :
          new FOMXmlRestrictedCharReader(
            in,charset,options.getFilterRestrictedCharacterReplacement());
        return parse(StAXUtils.createXMLStreamReader(rdr), base, options);
      } else {
        XMLStreamReader xmlreader = (charset == null) ?
          createXMLStreamReader(in) :
          createXMLStreamReader(in, charset);
        return parse(xmlreader, base, options);
      }
    } catch (Exception e) {
      if (!(e instanceof ParseException))
        e = new ParseException(e);
      throw (ParseException)e;
    }
  }

  public <T extends Element> Document<T> parse(
    Reader in,
    String base,
    ParserOptions options)
      throws ParseException {
    if (in == null)
      throw new IllegalArgumentException(Localizer.get("READER.NOT.NULL"));
    try {
      if (options == null) options = getDefaultParserOptions();
      if (options.getFilterRestrictedCharacters() &&
          !(in instanceof FOMXmlRestrictedCharReader)) {
        in = new FOMXmlRestrictedCharReader(
          in,options.getFilterRestrictedCharacterReplacement());
      }
      //return parse(StAXUtils.createXMLStreamReader(in), base, options);
      return parse(createXMLStreamReader(in), base, options);
    } catch (Exception e) {
      if (!(e instanceof ParseException))
        e = new ParseException(e);
      throw (ParseException)e;
    }
  }

  private static XMLInputFactory getXMLInputFactory() {
    XMLInputFactory inputFactory = StAXUtils.getXMLInputFactory();
    //inputFactory.setProperty(XMLInputFactory.IS_REPLACING_ENTITY_REFERENCES, Boolean.FALSE);
    return inputFactory;
  }
 
  private static void releaseXMLInputFactory(XMLInputFactory inputFactory) {
    StAXUtils.releaseXMLInputFactory(inputFactory);
  }
 
  public static XMLStreamReader createXMLStreamReader(
    InputStream in,
    String encoding)
      throws XMLStreamException {
    XMLInputFactory inputFactory = getXMLInputFactory();
    try {
      return inputFactory.createXMLStreamReader(in, encoding);
    } finally {
      releaseXMLInputFactory(inputFactory);
    }
  }

  public static XMLStreamReader createXMLStreamReader(
    InputStream in)
      throws XMLStreamException {
    XMLInputFactory inputFactory = getXMLInputFactory();
    try {
      return inputFactory.createXMLStreamReader(in);
    } finally {
      releaseXMLInputFactory(inputFactory);
    }
  }
 
  private XMLStreamReader createXMLStreamReader(Reader in) throws XMLStreamException {
    XMLInputFactory inputFactory = getXMLInputFactory();
    try {   
      XMLStreamReader reader = inputFactory.createXMLStreamReader(in);
      return reader;
    } finally {
      releaseXMLInputFactory(inputFactory);
    }   
  }
 
  private <T extends Element> Document<T> parse(
    XMLStreamReader reader,
    String base,
    ParserOptions options)
      throws ParseException {
    try {
      FOMBuilder builder =
        new FOMBuilder(
          getFomFactory(options),
          reader,
          options);
      return getDocument(builder, base != null ? new IRI(base) : null, options);
    } catch (Exception e) {
      if (!(e instanceof ParseException))
        e = new ParseException(e);
      throw (ParseException)e;
    }
  }

  @Override
  protected ParserOptions initDefaultParserOptions() {
    return new FOMParserOptions(getFactory());
  }

}
TOP

Related Classes of org.apache.abdera.parser.stax.FOMParser

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.