All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.thaiopensource.relaxng.parse.compact.CompactParseable Maven / Gradle / Ivy

Go to download

Jing is a validator for RELAX NG and other schema languages. This project was taken from http://code.google.com/p/jing-trang and mavenized for inclusion in the Wicket Stuff HTML Validator. The code was taken from the 20091111 release.

There is a newer version: 1.11
Show newest version
package com.thaiopensource.relaxng.parse.compact;

import com.thaiopensource.relaxng.parse.Annotations;
import com.thaiopensource.relaxng.parse.BuildException;
import com.thaiopensource.relaxng.parse.CommentList;
import com.thaiopensource.relaxng.parse.IllegalSchemaException;
import com.thaiopensource.relaxng.parse.IncludedGrammar;
import com.thaiopensource.relaxng.parse.SchemaBuilder;
import com.thaiopensource.relaxng.parse.Scope;
import com.thaiopensource.relaxng.parse.SubParseable;
import com.thaiopensource.resolver.Identifier;
import com.thaiopensource.resolver.Input;
import com.thaiopensource.resolver.MediaTypedIdentifier;
import com.thaiopensource.resolver.Resolver;
import com.thaiopensource.resolver.ResolverException;
import com.thaiopensource.util.Uri;
import com.thaiopensource.xml.util.EncodingMap;
import org.xml.sax.ErrorHandler;

import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.PushbackInputStream;
import java.io.Reader;

public class CompactParseable, A extends Annotations>
        implements SubParseable {
  private final Input in;
  private final Resolver resolver;
  private final ErrorHandler eh;
  private static final String MEDIA_TYPE = "application/relax-ng-compact-syntax";

  public CompactParseable(Input in, Resolver resolver, ErrorHandler eh) {
    this.in = in;
    this.resolver = resolver;
    this.eh = eh;
  }

  public P parse(SchemaBuilder sb, Scope scope) throws BuildException, IllegalSchemaException {
    return new CompactSyntax(makeReader(in), in.getUri(), sb, eh).parse(scope);
  }

  public SubParseable createSubParseable(String href, String base) throws BuildException {
    Identifier id = new MediaTypedIdentifier(href, base, MEDIA_TYPE);
    Input input = new Input();
    try {
      resolver.resolve(id, input);
    }
    catch (ResolverException e) {
      throw BuildException.fromResolverException(e);
    }
    catch (IOException e) {
      throw new BuildException(e);
    }
    return new CompactParseable(input, resolver, eh);
  }

  public P parseAsInclude(SchemaBuilder sb, IncludedGrammar g)
          throws BuildException, IllegalSchemaException {
    return new CompactSyntax(makeReader(in), in.getUri(), sb, eh).parseInclude(g);
  }

  public String getUri() {
    String uri = in.getUri();
    if (uri == null)
      return null;
    return Uri.escapeDisallowedChars(uri);
  }

  private static final String UTF8 = EncodingMap.getJavaName("UTF-8");
  private static final String UTF16 = EncodingMap.getJavaName("UTF-16");

  private Reader makeReader(Input in) throws BuildException {
    try {
      resolver.open(in);
      Reader reader = in.getCharacterStream();
      if (reader == null) {
        InputStream byteStream = in.getByteStream();
        if (byteStream == null)
          throw new IllegalArgumentException("invalid input for CompactParseable");
        String encoding = in.getEncoding();
        if (encoding == null) {
          PushbackInputStream pb = new PushbackInputStream(byteStream, 2);
          encoding = detectEncoding(pb);
          byteStream = pb;
        }
        reader = new InputStreamReader(byteStream, encoding);
      }
      return reader;
    }
    catch (ResolverException e) {
      throw BuildException.fromResolverException(e);
    }
    catch (IOException e) {
      throw new BuildException(e);
    }
  }

  static private String detectEncoding(PushbackInputStream in) throws IOException {
    String encoding = UTF8;
    int b1 = in.read();
    if (b1 != -1) {
      int b2 = in.read();
      if (b2 != -1) {
        in.unread(b2);
        if ((b1 == 0xFF && b2 == 0xFE) || (b1 == 0xFE && b2 == 0xFF))
          encoding = UTF16;
      }
      in.unread(b1);
    }
    return encoding;
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy