org.htmlparser.scanners.ResourceScanner Maven / Gradle / Ivy
/**
* Copyright 2008 biaoping.yin
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.htmlparser.scanners;
import java.util.ArrayList;
import java.util.List;
import org.htmlparser.Attribute;
import org.htmlparser.Node;
import org.htmlparser.Tag;
import org.htmlparser.lexer.Lexer;
import org.htmlparser.util.NodeList;
import org.htmlparser.util.ParserException;
/**
* Title: ResourceScanner.java
*
* Description:
*
* Copyright: Copyright (c) 2007
*
* bboss workgroup
* @Date 2013-9-24
* @author biaoping.yin
* @version 1.0
*/
public class ResourceScanner extends CompositeTagScanner
{
/**
* Create a style scanner.
*/
public ResourceScanner ()
{
}
private boolean inIds(String tagname,String[] ids)
{
for(String id:ids)
{
if(tagname.equals(id))
return true;
}
return false;
}
/**
* Scan for style definitions.
* Accumulates text from the page, until </[a-zA-Z] is encountered.
* @param tag The tag this scanner is responsible for.
* @param lexer The source of CDATA.
* @param stack The parse stack, not used.
*/
public Tag scan (Tag tag, Lexer lexer, NodeList stack)
throws ParserException
{
String tagname = tag.getTagName();
int len = tagname.length();
Node content;
int position;
Node node;
Attribute attribute;
List vector;
// content = lexer.parseCDATA ();
content = lexer.parseCDATA ();
// content = lexer.parseCompositeCDATA_(false, tagname.toLowerCase() + "]", len);
position = lexer.getPosition ();
node = lexer.nextNode (false);
if (null != node)
if (!(node instanceof Tag) || !( ((Tag)node).isEndTag ()
&& ((Tag)node).getTagName ().equals (tagname)))
{
lexer.setPosition (position);
node = null;
}
// build new end tag if required
if (null == node)
{
attribute = new Attribute ("/" + tagname.toLowerCase(), null);
vector = new ArrayList ();
vector.add (attribute);
node = lexer.getNodeFactory ().createTagNode (
lexer.getPage (), position, position, vector);
}
tag.setEndTag ((Tag)node);
if (null != content)
{
tag.setChildren (new NodeList (content));
content.setParent (tag);
}
node.setParent (tag);
tag.doSemanticAction ();
return (tag);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy