Merge pull request #321 in CORE/base-third from ~HUGH.C/base-third:bugfix/10.0 to bugfix/10.0

* commit '4f71896be84d6e4264e5a03c94e5bea252180598': REPORT-25253 Html无法解析小于号
5 years ago · 7869153cf7
2 changed files with 32 additions and 7 deletions
--- a/fine-itext/src/com/fr/third/v2/lowagie/text/html/simpleparser/HTMLWorker.java
+++ b/fine-itext/src/com/fr/third/v2/lowagie/text/html/simpleparser/HTMLWorker.java
@ -804,10 +804,15 @@ public class HTMLWorker implements SimpleXMLDocHandler, DocListener {
 	public static final HashMap tagsSupported = new HashMap();
 	public static final HashMap tagsPrefixSupported = new HashMap();
 	static {
 		StringTokenizer tok = new StringTokenizer(tagsSupportedString);
-		while (tok.hasMoreTokens())
+		while (tok.hasMoreTokens()){
-			tagsSupported.put(tok.nextToken(), null);
+			String s = tok.nextToken();
 			tagsSupported.put(s, null);
 			tagsPrefixSupported.put(s.charAt(0), null);
 		}
 	}
 }
--- a/fine-itext/src/com/fr/third/v2/lowagie/text/xml/simpleparser/SimpleXMLParser.java
+++ b/fine-itext/src/com/fr/third/v2/lowagie/text/xml/simpleparser/SimpleXMLParser.java
@ -75,6 +75,8 @@
 */
 package com.fr.third.v2.lowagie.text.xml.simpleparser;
 import com.fr.third.v2.lowagie.text.html.simpleparser.HTMLWorker;
 import java.io.BufferedReader;
 import java.io.ByteArrayOutputStream;
 import java.io.IOException;
@ -229,16 +231,13 @@ public final class SimpleXMLParser {
            // we are in an unknown state before there's actual content
 			case UNKNOWN:
                if(character == '<') {
-                    saveState(TEXT);
+                    beginnOfTag((char) reader.read(), UNKNOWN);
                    state = TAG_ENCOUNTERED;
                }
                break;
            // we can encounter any content
 			case TEXT:
                if(character == '<') {
-                    flush();
+                    beginnOfTag((char) reader.read(), TEXT);
                    saveState(state);
                    state = TAG_ENCOUNTERED;
                } else if(character == '&') {
                    saveState(state);
                    entity.setLength(0);
@ -481,6 +480,27 @@ public final class SimpleXMLParser {
        }
    }
    /**
     * 处理标签的开头，若不在支持标签范围内，将<符号作为文本处理，例：<1111 (仿造浏览器的处理方式)
     */
    public void beginnOfTag(char c, int type) {
        previousCharacter = c;
        if (c == -1) {
            return;
        }
        if (c == '/' || HTMLWorker.tagsPrefixSupported.containsKey(c)) {
            if (type == TEXT) {
                flush();
            }
            saveState(TEXT);
            state = TAG_ENCOUNTERED;
            return;
        }
        text.append((char) character);
        nowhite = true;
    }
    /**
     * Gets a state from the stack
     * @return the previous state