ReducedHTMLParserTest.java

Bruno Aranda Fri, 11 Nov 2005 12:48:44 -0800

Mmm, definitely it is friday night. The message for the commit should
have been for MYFACES-809 and not MYFACES-508. When neurons begin to
stop you should keep away from the computer...


Thanks for your patience :-)

BTW, any chance to change to comment?

Regards,

Bruno

2005/11/11, [EMAIL PROTECTED] <[EMAIL PROTECTED]>:
> Author: baranda
> Date: Fri Nov 11 12:29:52 2005
> New Revision: 332640
>
> URL: http://svn.apache.org/viewcvs?rev=332640&view=rev
> Log:
> Applied patch for MYFACES-508. Thanks Simon Kitching
>
> Modified:
>     
> myfaces/tomahawk/trunk/src/java/org/apache/myfaces/component/html/util/ReducedHTMLParser.java
>     
> myfaces/tomahawk/trunk/src/test/org/apache/myfaces/component/html/util/ReducedHTMLParserTest.java
>
> Modified: 
> myfaces/tomahawk/trunk/src/java/org/apache/myfaces/component/html/util/ReducedHTMLParser.java
> URL: 
> http://svn.apache.org/viewcvs/myfaces/tomahawk/trunk/src/java/org/apache/myfaces/component/html/util/ReducedHTMLParser.java?rev=332640&r1=332639&r2=332640&view=diff
> ==============================================================================
> --- 
> myfaces/tomahawk/trunk/src/java/org/apache/myfaces/component/html/util/ReducedHTMLParser.java
>  (original)
> +++ 
> myfaces/tomahawk/trunk/src/java/org/apache/myfaces/component/html/util/ReducedHTMLParser.java
>  Fri Nov 11 12:29:52 2005
> @@ -20,7 +20,7 @@
>
>  /**
>   * A class which detects the open/close tags in an HTML document and reports
> - * them to a listener class.
> + * them to a listener class.
>   * <p>
>   * This is unfortunately necessary when using JSF with JSP, as tags in the 
> body
>   * of the document can need to output commands into the document at points
> @@ -52,81 +52,98 @@
>      private static final int STATE_IN_TAG = 2;
>      private static final int STATE_IN_MARKED_SECTION = 3;
>      private static final int STATE_EXPECTING_ETAGO = 4;
> -
> -    private int offset;
> -    private int lineNumber;
> -    private CharSequence seq;
> -    private CallbackListener listener;
> -
> +
> +    private int _offset;
> +    private int _lineNumber;
> +    private CharSequence _seq;
> +    private CallbackListener _listener;
> +
>      public static void parse(CharSequence seq, CallbackListener l)
>      {
>          new ReducedHTMLParser(seq, l).parse();
>      }
> -
> +
>      /**
>       * Constructor, package-scope for unit testing.
> -     *
> +     *
>       * @param s is the sequence of chars to parse.
>       * @param l is the listener to invoke callbacks on.
>       */
> -    ReducedHTMLParser(CharSequence s, CallbackListener l) {
> -        seq = s;
> -        listener = l;
> +    ReducedHTMLParser(CharSequence s, CallbackListener l)
> +    {
> +        _seq = s;
> +        _listener = l;
>      }
>
>      /**
>       * Return true if there are no more characters to parse.
>       */
> -    boolean isFinished() {
> -        return offset >= seq.length();
> +    boolean isFinished()
> +    {
> +        return _offset >= _seq.length();
>      }
>
> -    int getCurrentLineNumber() {
> -         return lineNumber;
> +    int getCurrentLineNumber()
> +    {
> +         return _lineNumber;
>      }
>
>      /**
>       * Advance the current parse position over any whitespace characters.
>       */
> -    void consumeWhitespace() {
> +    void consumeWhitespace()
> +    {
>          boolean crSeen = false;
>
> -        while (offset < seq.length()) {
> -            char c = seq.charAt(offset);
> -            if (!Character.isWhitespace(c)) {
> +        while (_offset < _seq.length())
> +        {
> +            char c = _seq.charAt(_offset);
> +            if (!Character.isWhitespace(c))
> +            {
>                  break;
>              }
>
>              // Track line number for error messages.
> -            if (c == '\r') {
> -                ++lineNumber;
> +            if (c == '\r')
> +            {
> +                ++_lineNumber;
>                  crSeen = true;
> -            } else if ((c == '\n') && !crSeen) {
> -                ++lineNumber;
> -            } else {
> +            }
> +            else if ((c == '\n') && !crSeen)
> +            {
> +                ++_lineNumber;
> +            }
> +            else
> +            {
>                  crSeen = false;
>              }
>
> -            ++offset;
> +            ++_offset;
>          }
>      }
>
>      /**
>       * Eat up a sequence of non-whitespace characters and return them.
>       */
> -    String consumeNonWhitespace() {
> -        int wordStart = offset;
> -        while (offset < seq.length()) {
> -            char c = seq.charAt(offset);
> -            if (Character.isWhitespace(c)) {
> +    String consumeNonWhitespace()
> +    {
> +        int wordStart = _offset;
> +        while (_offset < _seq.length())
> +        {
> +            char c = _seq.charAt(_offset);
> +            if (Character.isWhitespace(c))
> +            {
>                  break;
>              }
> -            ++offset;
> +            ++_offset;
>          }
> -        if (wordStart == offset) {
> +        if (wordStart == _offset)
> +        {
>              return null;
> -        } else {
> -            return seq.subSequence(wordStart, offset).toString();
> +        }
> +        else
> +        {
> +            return _seq.subSequence(wordStart, _offset).toString();
>          }
>      }
>
> @@ -134,28 +151,34 @@
>       * If the next chars in the input sequence exactly match the specified
>       * string then skip over them and return true.
>       * <p>
> -     * If there is not a match then leave the current parse position
> +     * If there is not a match then leave the current parse position
>       * unchanged and return false.
> -     *
> +     *
>       * @param s is the exact string to match.
>       * @return true if the input contains exactly the param s
>       */
> -    boolean consumeMatch(String s) {
> -        if (offset + s.length() > seq.length()) {
> +    boolean consumeMatch(String s)
> +    {
> +        if (_offset + s.length() > _seq.length())
> +        {
>              // seq isn't long enough to contain the specified string
>              return false;
>          }
>
>          int i = 0;
> -        while (i < s.length()) {
> -            if (seq.charAt(offset+i) == s.charAt(i)) {
> +        while (i < s.length())
> +        {
> +            if (_seq.charAt(_offset+i) == s.charAt(i))
> +            {
>                  ++i;
> -            } else {
> +            }
> +            else
> +            {
>                  return false;
>              }
>          }
> -
> -        offset += i;
> +
> +        _offset += i;
>          return true;
>      }
>
> @@ -164,42 +187,56 @@
>       * <p>
>       * TODO: implement this properly in compliance with spec
>       */
> -    String consumeElementName() {
> +    String consumeElementName()
> +    {
>          consumeWhitespace();
> -        int nameStart = offset;
> -        while (!isFinished()) {
> +        int nameStart = _offset;
> +        while (!isFinished())
> +        {
>              boolean ok = false;
> -            char c = seq.charAt(offset);
> -            if (Character.isLetterOrDigit(seq.charAt(offset))) {
> +            char c = _seq.charAt(_offset);
> +            if (Character.isLetterOrDigit(_seq.charAt(_offset)))
> +            {
>                  ok = true;
> -            } else if (c == '_') {
> +            }
> +            else if (c == '_')
> +            {
>                  ok = true;
> -            } else if (c == '-') {
> +            }
> +            else if (c == '-')
> +            {
>                  ok = true;
> -            } else if (c == ':') {
> +            }
> +            else if (c == ':')
> +            {
>                  ok = true;
>              }
> -
> -            if (!ok) {
> +
> +            if (!ok)
> +            {
>                  break;
>              }
>
> -            ++offset;
> +            ++_offset;
>          }
> -
> -        if (nameStart == offset) {
> +
> +        if (nameStart == _offset)
> +        {
>              return null;
> -        } else {
> -            return seq.subSequence(nameStart, offset).toString();
> +        }
> +        else
> +        {
> +            return _seq.subSequence(nameStart, _offset).toString();
>          }
>      }
>
>      /**
> -     * Eat up a sequence of chars which form a valid XML attribute name.
> +     * Eat up a sequence of chars which form a valid XML attribute name.
>       * <p>
>       * TODO: implement this properly in compliance with spec
>       */
> -    String consumeAttrName() {
> +    String consumeAttrName()
> +    {
>          // for now, assume elements and attributes have same rules
>          return consumeElementName();
>      }
> @@ -212,7 +249,8 @@
>       * This method assumes that the leading quote has already been
>       * consumed.
>       */
> -    String consumeString(char quote) {
> +    String consumeString(char quote)
> +    {
>          // TODO: should we consider a string to be terminated by a newline?
>          // that would help with runaway strings but I think that multiline
>          // strings *are* allowed...
> @@ -222,25 +260,37 @@
>          // few lines out in an error message isn't serious either.
>          StringBuffer stringBuf = new StringBuffer();
>          boolean escaping = false;
> -        while (!isFinished()) {
> -            char c = seq.charAt(offset);
> -            ++offset;
> -            if (c == quote) {
> -                if (!escaping) {
> +        while (!isFinished())
> +        {
> +            char c = _seq.charAt(_offset);
> +            ++_offset;
> +            if (c == quote)
> +            {
> +                if (!escaping)
> +                {
>                      break;
> -                } else {
> +                }
> +                else
> +                {
>                      stringBuf.append(c);
>                      escaping = false;
>                  }
> -            } else if (c == '\\') {
> -                if (escaping) {
> +            }
> +            else if (c == '\\')
> +            {
> +                if (escaping)
> +                {
>                      // append a real backslash
>                      stringBuf.append(c);
>                      escaping = false;
> -                } else {
> +                }
> +                else
> +                {
>                      escaping = true;
>                  }
> -            } else {
> +            }
> +            else
> +            {
>                  stringBuf.append(c);
>              }
>          }
> @@ -251,19 +301,25 @@
>       * Assuming we have already encountered "attrname=", consume the
>       * value part of the attribute definition. Note that unlike XML,
>       * HTML doesn't have to quote its attribute values.
> -     *
> -     * @return the attribute value. If the attr-value was quoted,
> +     *
> +     * @return the attribute value. If the attr-value was quoted,
>       * the returned value will not include the quote chars.
>       */
> -    String consumeAttrValue() {
> +    String consumeAttrValue()
> +    {
>          consumeWhitespace();
>          char singleQuote = '\'';
> -
> -        if (consumeMatch("'")) {
> +
> +        if (consumeMatch("'"))
> +        {
>              return consumeString('\'');
> -        } else if (consumeMatch("\"")) {
> +        }
> +        else if (consumeMatch("\""))
> +        {
>              return consumeString('"');
> -        } else {
> +        }
> +        else
> +        {
>              return consumeNonWhitespace();
>          }
>      }
> @@ -271,40 +327,53 @@
>      /**
>       * Discard all characters in the input until one in the specified
>       * string (character-set) is found.
> -     *
> +     *
>       * @param s is a set of characters that should not be discarded.
>       */
> -    void consumeExcept(String s) {
> +    void consumeExcept(String s)
> +    {
>          boolean crSeen = false;
>
> -        while (offset < seq.length()) {
> -            char c = seq.charAt(offset);
> -            if (s.indexOf(c) >= 0) {
> +        while (_offset < _seq.length())
> +        {
> +            char c = _seq.charAt(_offset);
> +            if (s.indexOf(c) >= 0)
> +            {
>                  // char is in the exception set
>                  return;
>              }
>
>               // Track line number for error messages.
> -             if (c == '\r') {
> -                 ++lineNumber;
> +             if (c == '\r')
> +             {
> +                 ++_lineNumber;
>                   crSeen = true;
> -             } else if ((c == '\n') && !crSeen) {
> -                 ++lineNumber;
> -             } else {
> +             }
> +             else if ((c == '\n') && !crSeen)
> +             {
> +                 ++_lineNumber;
> +             }
> +             else
> +             {
>                   crSeen = false;
>               }
> -
> +
>              // Track line number for error messages.
> -            if (c == '\r') {
> -                ++lineNumber;
> +            if (c == '\r')
> +            {
> +                ++_lineNumber;
>                  crSeen = true;
> -            } else if ((c == '\n') && !crSeen) {
> -                ++lineNumber;
> -            } else {
> +            }
> +            else if ((c == '\n') && !crSeen)
> +            {
> +                ++_lineNumber;
> +            }
> +            else
> +            {
>                  crSeen = false;
>              }
>
> -            ++offset;
> +            ++_offset;
>          }
>      }
>
> @@ -312,44 +381,52 @@
>       * Process the entire input buffer, invoking callbacks on the listener
>       * object as appropriate.
>       */
> -    void parse() {
> +    void parse()
> +    {
>          int state = STATE_READY;
> -
> +
>          int currentTagStart = -1;
>          String currentTagName = null;
>
> -        lineNumber = 1;
> -        offset = 0;
> -        int lastOffset = offset -1;
> -        while (offset < seq.length())
> +        _lineNumber = 1;
> +        _offset = 0;
> +        int lastOffset = _offset -1;
> +        while (_offset < _seq.length())
>          {
>              // Sanity check; each pass through this loop must increase the 
> offset.
>              // Failure to do this means a hang situation has occurred.
> -            if (offset <= lastOffset)
> +            if (_offset <= lastOffset)
>              {
>                  // throw new RuntimeException("Infinite loop detected in 
> ReducedHTMLParser");
>                  log.error("Infinite loop detected in ReducedHTMLParser; 
> parsing skipped");
>                  //return;
>              }
> -            lastOffset = offset;
> -
> -            if (state == STATE_READY) {
> +            lastOffset = _offset;
> +
> +            if (state == STATE_READY)
> +            {
>                  // in this state, nothing but "<" has any significance
>                  consumeExcept("<");
> -                if (isFinished()) {
> +                if (isFinished())
> +                {
>                      break;
>                  }
>
> -                if (consumeMatch("<!--")) {
> +                if (consumeMatch("<!--"))
> +                {
>                      // Note that whitespace is *not* permitted in <!--
>                      state = STATE_IN_COMMENT;
> -                } else if (consumeMatch("<![")) {
> -                    // Start of a "marked section", eg "<![CDATA" or
> -                    // "<![INCLUDE" or "<![IGNORE". These always terminate
> +                }
> +                else if (consumeMatch("<!["))
> +                {
> +                    // Start of a "marked section", eg "<![CDATA" or
> +                    // "<![INCLUDE" or "<![IGNORE". These always terminate
>                      // with "]]>"
>                      log.debug("Marked section found at line " + 
> getCurrentLineNumber());
>                      state = STATE_IN_MARKED_SECTION;
> -                } else if (consumeMatch("<!DOCTYPE")) {
> +                }
> +                else if (consumeMatch("<!DOCTYPE"))
> +                {
>                      log.debug("DOCTYPE found at line " + 
> getCurrentLineNumber());
>                      // we don't need to actually do anything here; the
>                      // tag can't contain a bare "<", so the first "<"
> @@ -359,94 +436,121 @@
>                      // that case there *will* be embedded < chars in the 
> document. However
>                      // that's very unlikely to be used in a JSF page, so 
> this is pretty low
>                      // priority.
> -                } else if (consumeMatch("<?")) {
> +                }
> +                else if (consumeMatch("<?"))
> +                {
>                      // xml processing instruction or <!DOCTYPE> tag
>                      // we don't need to actually do anything here; the
>                      // tag can't contain a bare "<", so the first "<"
>                      // indicates the start of the next real tag.
>                      log.debug("PI found at line " + getCurrentLineNumber());
> -                } else if (consumeMatch("</")) {
> -                    if (!processEndTag()) {
> +                }
> +                else if (consumeMatch("</"))
> +                {
> +                    if (!processEndTag())
> +                    {
>                          // message already logged
>                          return;
>                      }
>
>                      // stay in state READY
>                      state = STATE_READY;
> -                } else if (consumeMatch("<")) {
> +                }
> +                else if (consumeMatch("<"))
> +                {
>                      // We can't tell the user that the tag has closed until 
> after we have
>                      // processed any attributes and found the real end of 
> the tag. So save
>                      // the current info until the end of this tag.
> -                    currentTagStart = offset - 1;
> +                    currentTagStart = _offset - 1;
>                      currentTagName = consumeElementName();
> -                    if (currentTagName == null) {
> +                    if (currentTagName == null)
> +                    {
>                          log.warn("Invalid HTML; bare lessthan sign found at 
> line "
>                              + getCurrentLineNumber());
>                          // remain in STATE_READY; this isn't really the 
> start of
>                          // an xml element.
> -                    } else {
> +                    }
> +                    else
> +                    {
>                          state = STATE_IN_TAG;
>                      }
> -                } else {
> +                }
> +                else
> +                {
>                      // should never get here
>                      throw new Error("Internal error at line " + 
> getCurrentLineNumber());
>                  }
> -
> +
>                  continue;
>              }
>
> -            if (state == STATE_IN_COMMENT) {
> +            if (state == STATE_IN_COMMENT)
> +            {
>                  // TODO: handle "--  >", which is a valid way to close a
>                  // comment according to the specs.
>
>                  // in this state, nothing but "--" has any significance
>                  consumeExcept("-");
> -                if (isFinished()) {
> +                if (isFinished())
> +                {
>                      break;
>                  }
>
> -                if (consumeMatch("-->")) {
> +                if (consumeMatch("-->"))
> +                {
>                      state = STATE_READY;
> -                } else  {
> +                }
> +                else
> +                {
>                      // false call; hyphen is not end of comment
>                      consumeMatch("-");
>                  }
> -
> +
>                  continue;
>              }
> -
> -            if (state == STATE_IN_TAG) {
> +
> +            if (state == STATE_IN_TAG)
> +            {
>                  consumeWhitespace();
> -
> -                if (consumeMatch("/>")) {
> +
> +                if (consumeMatch("/>"))
> +                {
>                      // ok, end of element
>                      state = STATE_READY;
> -                    closedTag(currentTagStart, offset, currentTagName);
> -
> +                    closedTag(currentTagStart, _offset, currentTagName);
> +
>                      // and reset vars just in case...
>                      currentTagStart = -1;
>                      currentTagName = null;
> -                } else if (consumeMatch(">")) {
> -                    if (currentTagName.equalsIgnoreCase("script")
> -                        || currentTagName.equalsIgnoreCase("style")) {
> +                }
> +                else if (consumeMatch(">"))
> +                {
> +                    if (currentTagName.equalsIgnoreCase("script")
> +                        || currentTagName.equalsIgnoreCase("style"))
> +                    {
>                          // We've just started a special tag which can 
> contain anything except
>                          // the ETAGO marker ("</"). See
>                          // 
> http://www.w3.org/TR/REC-html40/appendix/notes.html#notes-specifying-data
>                          state = STATE_EXPECTING_ETAGO;
> -                    } else {
> +                    }
> +                    else
> +                    {
>                          state = STATE_READY;
>                      }
>
>                      // end of open tag, but not end of element
> -                    openedTag(currentTagStart, offset, currentTagName);
> -
> +                    openedTag(currentTagStart, _offset, currentTagName);
> +
>                      // and reset vars just in case...
>                      currentTagStart = -1;
>                      currentTagName = null;
> -                } else {
> +                }
> +                else
> +                {
>                      // xml attribute
>                      String attrName = consumeAttrName();
> -                    if (attrName == null) {
> +                    if (attrName == null)
> +                    {
>                          // Oops, we found something quite unexpected in this 
> tag.
>                          // The best we can do is probably to drop back to 
> looking
>                          // for "/>", though that does risk us 
> misinterpreting the
> @@ -455,55 +559,69 @@
>                                  + " at line " + getCurrentLineNumber());
>                          state = STATE_EXPECTING_ETAGO;
>                          // and consume one character
> -                        ++offset;
> -                    } else {
> +                        ++_offset;
> +                    }
> +                    else
> +                    {
>                          consumeWhitespace();
> -
> +
>                          // html can have "stand-alone" attributes with no 
> following equals sign
> -                        if (consumeMatch("=")) {
> +                        if (consumeMatch("="))
> +                        {
>                              String attrValue = consumeAttrValue();
>                          }
>                      }
>                  }
> -
> +
>                  continue;
>              }
>
> -            if (state == STATE_IN_MARKED_SECTION) {
> +            if (state == STATE_IN_MARKED_SECTION)
> +            {
>                  // in this state, nothing but "]]>" has any significance
>                  consumeExcept("]");
> -                if (isFinished()) {
> +                if (isFinished())
> +                {
>                      break;
>                  }
>
> -                if (consumeMatch("]]>")) {
> +                if (consumeMatch("]]>"))
> +                {
>                      state = STATE_READY;
> -                } else  {
> +                }
> +                else
> +                {
>                      // false call; ] is not end of cdata section
>                      consumeMatch("]");
>                  }
> -
> +
>                  continue;
>              }
>
> -            if (state == STATE_EXPECTING_ETAGO) {
> +            if (state == STATE_EXPECTING_ETAGO)
> +            {
>                  // The term "ETAGO" is the official spec term for "</".
>                  consumeExcept("<");
> -                if (isFinished()) {
> +                if (isFinished())
> +                {
>                      log.debug("Malformed input page; input terminated while 
> tag not closed.");
>                      break;
>                  }
>
> -                if (consumeMatch("</")) {
> -                    if (!processEndTag()) {
> +                if (consumeMatch("</"))
> +                {
> +                    if (!processEndTag())
> +                    {
>                          return;
>                      }
>                      state = STATE_READY;
> -                } else  {
> +                }
> +                else
> +                {
>                      // false call; < does not start an ETAGO
>                      consumeMatch("<");
>                  }
> -
> +
>                  continue;
>              }
>          }
> @@ -513,15 +631,17 @@
>       * Invoked when "&lt;/" has been seen in the input, this method
>       * handles the parsing of the end tag and the invocation of the
>       * appropriate callback method.
> -     *
> +     *
>       * @return true if the tag was successfully parsed, and false
>       * if there was a fatal parsing error.
>       */
> -    private boolean processEndTag() {
> -        int tagStart = offset - 2;
> +    private boolean processEndTag()
> +    {
> +        int tagStart = _offset - 2;
>          String tagName = consumeElementName();
>          consumeWhitespace();
> -        if (!consumeMatch(">")) {
> +        if (!consumeMatch(">"))
> +        {
>              log.error("Malformed end tag at line " + getCurrentLineNumber()
>                      + "; skipping parsing");
>              return false;
> @@ -529,7 +649,7 @@
>
>
>          // inform user that the tag has been closed
> -        closedTag(tagStart, offset, tagName);
> +        closedTag(tagStart, _offset, tagName);
>
>          // We can't verify that the tag names balance because this is HTML
>          // we are processing, not XML.
> @@ -538,38 +658,50 @@
>
>      /**
>       * Invoke a callback method to inform the listener that we have found a 
> start tag.
> -     *
> +     *
>       * @param startOffset
>       * @param endOffset
>       * @param tagName
>       */
> -    void openedTag(int startOffset, int endOffset, String tagName) {
> +    void openedTag(int startOffset, int endOffset, String tagName)
> +    {
>          //log.debug("Found open tag at " + startOffset + ":" + endOffset + 
> ":" + tagName);
>
> -        if ("head".equalsIgnoreCase(tagName)) {
> -            listener.openedStartTag(startOffset, HEAD_TAG);
> -            listener.closedStartTag(endOffset, HEAD_TAG);
> -        } else if ("body".equalsIgnoreCase(tagName)) {
> -            listener.openedStartTag(startOffset, BODY_TAG);
> -            listener.closedStartTag(endOffset, BODY_TAG);
> -        } else if ("script".equalsIgnoreCase(tagName)) {
> -            listener.openedStartTag(startOffset, SCRIPT_TAG);
> -            listener.closedStartTag(endOffset, SCRIPT_TAG);
> +        if ("head".equalsIgnoreCase(tagName))
> +        {
> +            _listener.openedStartTag(startOffset, HEAD_TAG);
> +            _listener.closedStartTag(endOffset, HEAD_TAG);
> +        }
> +        else if ("body".equalsIgnoreCase(tagName))
> +        {
> +            _listener.openedStartTag(startOffset, BODY_TAG);
> +            _listener.closedStartTag(endOffset, BODY_TAG);
> +        }
> +        else if ("script".equalsIgnoreCase(tagName))
> +        {
> +            _listener.openedStartTag(startOffset, SCRIPT_TAG);
> +            _listener.closedStartTag(endOffset, SCRIPT_TAG);
>          }
>      }
>
> -    void closedTag(int startOffset, int endOffset, String tagName) {
> +    void closedTag(int startOffset, int endOffset, String tagName)
> +    {
>          //log.debug("Found close tag at " + startOffset + ":" + endOffset + 
> ":" + tagName);
> -
> -        if ("head".equalsIgnoreCase(tagName)) {
> -            listener.openedEndTag(startOffset, HEAD_TAG);
> -            listener.closedEndTag(endOffset, HEAD_TAG);
> -        } else if ("body".equalsIgnoreCase(tagName)) {
> -            listener.openedEndTag(startOffset, BODY_TAG);
> -            listener.closedEndTag(endOffset, BODY_TAG);
> -        } else if ("script".equalsIgnoreCase(tagName)) {
> -            listener.openedEndTag(startOffset, SCRIPT_TAG);
> -            listener.closedEndTag(endOffset, SCRIPT_TAG);
> +
> +        if ("head".equalsIgnoreCase(tagName))
> +        {
> +            _listener.openedEndTag(startOffset, HEAD_TAG);
> +            _listener.closedEndTag(endOffset, HEAD_TAG);
> +        }
> +        else if ("body".equalsIgnoreCase(tagName))
> +        {
> +            _listener.openedEndTag(startOffset, BODY_TAG);
> +            _listener.closedEndTag(endOffset, BODY_TAG);
> +        }
> +        else if ("script".equalsIgnoreCase(tagName))
> +        {
> +            _listener.openedEndTag(startOffset, SCRIPT_TAG);
> +            _listener.closedEndTag(endOffset, SCRIPT_TAG);
>          }
>      }
>  }
>
> Modified: 
> myfaces/tomahawk/trunk/src/test/org/apache/myfaces/component/html/util/ReducedHTMLParserTest.java
> URL: 
> http://svn.apache.org/viewcvs/myfaces/tomahawk/trunk/src/test/org/apache/myfaces/component/html/util/ReducedHTMLParserTest.java?rev=332640&r1=332639&r2=332640&view=diff
> ==============================================================================
> --- 
> myfaces/tomahawk/trunk/src/test/org/apache/myfaces/component/html/util/ReducedHTMLParserTest.java
>  (original)
> +++ 
> myfaces/tomahawk/trunk/src/test/org/apache/myfaces/component/html/util/ReducedHTMLParserTest.java
>  Fri Nov 11 12:29:52 2005
> @@ -15,11 +15,6 @@
>   */
>  package org.apache.myfaces.component.html.util;
>
> -import java.io.IOException;
> -import java.io.Writer;
> -import java.util.ArrayList;
> -import java.util.List;
> -
>  import junit.framework.TestCase;
>
>  /**
> @@ -43,7 +38,7 @@
>              if (tagIdentifier == ReducedHTMLParser.HEAD_TAG)
>              {
>                  beforeHeadStart = charIndex;
> -            }
> +            }
>              else if (tagIdentifier == ReducedHTMLParser.BODY_TAG)
>              {
>                  beforeBodyStart = charIndex;
> @@ -67,7 +62,7 @@
>              if (tagIdentifier == ReducedHTMLParser.HEAD_TAG)
>              {
>                  beforeHeadEnd = charIndex;
> -            }
> +            }
>              else if (tagIdentifier == ReducedHTMLParser.BODY_TAG)
>              {
>                  beforeBodyEnd = charIndex;
> @@ -90,7 +85,7 @@
>          {
>          }
>      }
> -
> +
>      public void testIsFinished1()
>      {
>          CharSequence seq = "";
> @@ -98,7 +93,7 @@
>          ReducedHTMLParser parser = new ReducedHTMLParser(seq, listener);
>          assertTrue("Empty sequence is finished", parser.isFinished());
>      }
> -
> +
>      public void testIsFinished2()
>      {
>          CharSequence seq = "xx yy";
> @@ -113,8 +108,8 @@
>          parser.consumeNonWhitespace();
>          assertTrue("Sequence is finished", parser.isFinished());
>      }
> -
> -    public void testConsumeWhitespace()
> +
> +    public void testConsumeWhitespace()
>      {
>          CharSequence seq = "  \t  \r\n   xx    yy  ";
>          CallbackListener listener = new ParseCallbackListener();
> @@ -126,7 +121,7 @@
>          parser.consumeWhitespace();
>          String word1 = parser.consumeNonWhitespace();
>          assertEquals("xx found", "xx", word1);
> -
> +
>          // test that multiple calls don't consume anything but whitespace
>          parser.consumeWhitespace();
>          parser.consumeWhitespace();
> @@ -141,8 +136,8 @@
>          parser.consumeWhitespace();
>          assertTrue("Sequence is finished", parser.isFinished());
>      }
> -
> -    public void testConsumeNonWhitespace()
> +
> +    public void testConsumeNonWhitespace()
>      {
>          CharSequence seq = "xx yy zz";
>          CallbackListener listener = new ParseCallbackListener();
> @@ -150,15 +145,15 @@
>
>          String word1 = parser.consumeNonWhitespace();
>          assertEquals("xx found", "xx", word1);
> -
> +
>          // test that a call against whitespace returns null
>          String noWord = parser.consumeNonWhitespace();
>          assertNull("ConsumeNonWhitespace when whitespace is present", 
> noWord);
> -
> +
>          // test that no exception is generated for multiple calls
>          parser.consumeNonWhitespace();
>          parser.consumeNonWhitespace();
> -
> +
>          parser.consumeWhitespace();
>          String word2 = parser.consumeNonWhitespace();
>          assertEquals("yy found", "yy", word2);
> @@ -176,8 +171,8 @@
>          noWord = parser.consumeNonWhitespace();
>          assertNull("ConsumeNonWhitespace at end of sequence", noWord);
>      }
> -
> -    public void testConsumeMatch()
> +
> +    public void testConsumeMatch()
>      {
>          CharSequence seq = "xx <!-- yy --> zz";
>          CallbackListener listener = new ParseCallbackListener();
> @@ -185,64 +180,64 @@
>
>          // test non-match
>          assertFalse("Match non-matching pattern", 
> parser.consumeMatch("ffff"));
> -
> +
>          // test valid match. Also verifies that previous match failure didn't
>          // move the parsing offset.
>          assertTrue("Match matching pattern", parser.consumeMatch("xx"));
> -
> +
>          // this won't match until whitespace removed
>          assertFalse("Match non-matching pattern", 
> parser.consumeMatch("<!--"));
>          parser.consumeWhitespace();
>          assertTrue("Match matching pattern", parser.consumeMatch("<!--"));
> -
> +
>          // repeat
>          assertFalse("Match non-matching pattern", parser.consumeMatch("yy"));
>          parser.consumeWhitespace();
>          assertTrue("Match matching pattern", parser.consumeMatch("yy"));
> -
> +
>          parser.consumeWhitespace();
>          assertTrue("Match matching pattern", parser.consumeMatch("-->"));
> -
> +
>          // match at end of sequence
>          parser.consumeWhitespace();
>          assertTrue("Match matching pattern", parser.consumeMatch("zz"));
> -
> +
>          // check no exception on matching on finished sequence
>          assertFalse("Match non-matching pattern", parser.consumeMatch("aa"));
>      }
> -
> -    public void testConsumeElementName()
> +
> +    public void testConsumeElementName()
>      {
>          CharSequence seq = "  foo  t:foo t:FooBar t:foo_bar element-name/>";
>          CallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(seq, listener);
>
>          // test that consumeElementName will automatically skip any leading 
> whitespace
> -        String name1 = parser.consumeElementName();
> +        String name1 = parser.consumeElementName();
>          assertEquals("Element name matched", "foo", name1);
> -
> -        String name2 = parser.consumeElementName();
> +
> +        String name2 = parser.consumeElementName();
>          assertEquals("Element name matched", "t:foo", name2);
> -
> -        String name3 = parser.consumeElementName();
> +
> +        String name3 = parser.consumeElementName();
>          assertEquals("Element name matched", "t:FooBar", name3);
> -
> -        String name4 = parser.consumeElementName();
> +
> +        String name4 = parser.consumeElementName();
>          assertEquals("Element name matched", "t:foo_bar", name4);
> -
> -        String name5 = parser.consumeElementName();
> +
> +        String name5 = parser.consumeElementName();
>          assertEquals("Element name matched", "element-name", name5);
>      }
> -
> -    public void testConsumeStringBasic()
> +
> +    public void testConsumeStringBasic()
>      {
>          CharSequence s1 = "'string1' \"string2\"";
>          CallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(s1, listener);
>
> -        // Note that the consumeString method always expects the leading 
> quote to
> +        // Note that the consumeString method always expects the leading 
> quote to
>          // have been consumed already..
> -
> +
>          // test single-quote delimited
>          parser.consumeMatch("'");
>          String str1 = parser.consumeString('\'');
> @@ -254,11 +249,11 @@
>          String str2 = parser.consumeString('\"');
>          assertEquals("String correctly parsed", "string2", str2);
>      }
> -
> -    public void testConsumeStringEscapedQuote()
> +
> +    public void testConsumeStringEscapedQuote()
>      {
>          char quoteMark = '\'';
> -
> +
>          // build literal sequence 'don\'t quote me' not-in-the-string
>          StringBuffer buf = new StringBuffer();
>          buf.append(quoteMark);
> @@ -269,19 +264,19 @@
>          CallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(buf, listener);
>
> -        // Note that the consumeString method always expects the leading 
> quote to
> +        // Note that the consumeString method always expects the leading 
> quote to
>          // have been consumed already..
> -
> +
>          parser.consumeMatch("'");
>          String str1 = parser.consumeString('\'');
>          assertEquals("String correctly parsed", "don't quote me", str1);
>      }
> -
> -    public void testConsumeStringEscapedEscape()
> +
> +    public void testConsumeStringEscapedEscape()
>      {
>          char quoteMark = '\'';
>          char backSlash = '\\';
> -
> +
>          // build literal sequence 'don\\'t escape me' not-in-the-string
>          // The double-backslash should be treated as a single backslash
>          // which does *not* escape the following quote.
> @@ -297,15 +292,15 @@
>          CallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(buf, listener);
>
> -        // Note that the consumeString method always expects the leading 
> quote to
> +        // Note that the consumeString method always expects the leading 
> quote to
>          // have been consumed already..
> -
> +
>          parser.consumeMatch("'");
>          String str1 = parser.consumeString('\'');
>          assertEquals("String correctly parsed", "don" + backSlash, str1);
>      }
>
> -    public void testConsumeAttrValue()
> +    public void testConsumeAttrValue()
>      {
>          CharSequence seq = "  bare 'quoted 1' \"quoted 2\" bare2 ";
>          CallbackListener listener = new ParseCallbackListener();
> @@ -323,8 +318,8 @@
>          String val4 = parser.consumeAttrValue();
>          assertEquals("Attr value matched", "bare2", val4);
>      }
> -
> -    public void testConsumeExcept()
> +
> +    public void testConsumeExcept()
>      {
>          CharSequence seq = "abc$$#dd  ee#ff-gghh ii";
>          CallbackListener listener = new ParseCallbackListener();
> @@ -337,59 +332,59 @@
>          parser.consumeExcept("z-");
>          String val2 = parser.consumeNonWhitespace();
>          assertEquals("ConsumeExcept skipped expected chars", "-gghh", val2);
> -
> +
>          // check that consumeExcept will reach end of buffer ok if none of
>          // the desired chars are found
>          assertFalse(parser.isFinished());
>          parser.consumeExcept("z");
>          assertTrue(parser.isFinished());
> -
> +
>          // check that calling consumeExcept is safe at end-of-buffer
>          parser.consumeExcept("z");
>      }
>
>      // test parsing completes when a lessthan is not followed by an element 
> name,
>      // and there is just whitespace up to end of the input.
> -    public void testParseBadTagNoElementName1()
> +    public void testParseBadTagNoElementName1()
>      {
>          String s = "xxxx \n\n <# \n\n";
>          CallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(s, listener);
> -
> +
>          parser.parse();
>          assertTrue(parser.isFinished());
>      }
>
>      // test parsing completes when a lessthan is not followed by an element 
> name,
> -    public void testParseBadTagNoElementName2()
> +    public void testParseBadTagNoElementName2()
>      {
>          String s = "xxxx \n\n <# \n\n hi there";
>          CallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(s, listener);
> -
> +
>          parser.parse();
>          assertTrue(parser.isFinished());
>      }
>
>      // test parsing completes when an invalid char is found where an 
> attribute name
>      // is expected.
> -    public void testParseBadTagInvalidAttributeName()
> +    public void testParseBadTagInvalidAttributeName()
>      {
>          String s = "<foo )/>";
>          CallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(s, listener);
> -
> +
>          parser.parse();
>          assertTrue(parser.isFinished());
>      }
>
>      // test CDATA sections are handled
> -    public void testParseCDATA()
> +    public void testParseCDATA()
>      {
>          String s = "xx<head> <![CDATA[ <head> ]]> <body>";
>          ParseCallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(s, listener);
> -
> +
>          parser.parse();
>          assertTrue(parser.isFinished());
>          assertEquals("CDATA works", 8, listener.afterHeadStart);
> @@ -397,12 +392,12 @@
>      }
>
>      // test PI sections are handled
> -    public void testParsePI()
> +    public void testParsePI()
>      {
>          String s = "<?xml version=\"1.0\"?> xx<head> ";
>          ParseCallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(s, listener);
> -
> +
>          parser.parse();
>          assertTrue(parser.isFinished());
>          assertEquals("PI works", 30, listener.afterHeadStart);
> @@ -410,7 +405,7 @@
>
>      // Test script element support; the spec states that a <script> or
>      // <style> tag can contain anything except "/>"
> -    public void testScript()
> +    public void testScript()
>      {
>          String s1 = "<head>";
>          String s2 = "<script type='text/javascript'>"
> @@ -430,7 +425,7 @@
>
>          ParseCallbackListener listener = new ParseCallbackListener();
>          ReducedHTMLParser parser = new ReducedHTMLParser(buf.toString(), 
> listener);
> -
> +
>          parser.parse();
>          assertTrue(parser.isFinished());
>          assertEquals("Script works", s1.length(), listener.afterHeadStart);
> @@ -443,7 +438,7 @@
>      }
>
>      // test the full parse method
> -    public void testParse()
> +    public void testParse()
>      {
>          String s0 = "<!DOCTYPE PUBLIC \"sss\" \"http:foo\">\n";
>          String s1 = "<html><head>";
> @@ -474,15 +469,15 @@
>          ReducedHTMLParser parser = new ReducedHTMLParser(buf, listener);
>
>          parser.parse();
> -
> +
>          // check that listener has correctly computed the offset to the char 
> just
>          // before the </head> tag starts.
>          int afterHeadStart = s0.length() + s1.length();
>          assertEquals("Pos after <head> tag ", afterHeadStart, 
> listener.afterHeadStart);
> -
> +
>          int beforeBodyStart = afterHeadStart + s2.length() + s3.length();
>          assertEquals("Pos before <body> tag", beforeBodyStart, 
> listener.beforeBodyStart);
> -
> +
>          int afterBodyStart = beforeBodyStart + s4.length();
>          assertEquals("Pos after <body> tag", afterBodyStart, 
> listener.afterBodyStart);
>      }
>
>
>

Re: svn commit: r332640 - in /myfaces/tomahawk/trunk/src: java/org/apache/myfaces/component/html/util/ReducedHTMLParser.java test/org/apache/myfaces/component/html/util/ReducedHTMLParserTest.java

Reply via email to