alvinalexander.com | career | drupal | java | mac | mysql | perl | scala | uml | unix  

What this is

This file is included in the DevDaily.com "Java Source Code Warehouse" project. The intent of this project is to help you "Learn Java by Example"™.

Other links

The source code

/*
 * JSPTokenMarker.java - JSP token marker
 * Copyright (C) 2001 by Romain Guy
 * Based on HTMLTokenMarker by Slava Pestov & Romain Guy
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 */
package org.gjt.sp.jedit.syntax;

import javax.swing.text.Segment;

/**
 * Token marker for JSP pages.
 *
 * <p>The marker is a hand-written state machine that walks one line at a
 * time. It recognises HTML text, tags, attributes, entities and comments,
 * JavaScript inside script elements (using the JavaScript keyword map) and
 * JSP scripting elements opened by {@code <%}, {@code <%=}, {@code <%!}
 * and {@code <%@} (using the Java keyword map).
 *
 * <p>The current state is carried in a single {@code byte}. Standard
 * {@code Token} ids double as states for the HTML and JavaScript parts; the
 * {@code JSP_*} constants are the same ids shifted by a fixed offset so that
 * Java code inside a scripting element can be told apart from JavaScript.
 *
 * @author Romain Guy
 */
public class JSPTokenMarker extends TokenMarker
{
  /** Distance between a standard token id and its {@code JSP_*} state. */
  private static final byte JSP_OFFSET = Token.INTERNAL_FIRST + 4;

  /** State: inside JavaScript code (after a script tag has been closed by '>'). */
  public static final byte JAVASCRIPT = Token.INTERNAL_FIRST;
  /** State: inside a double-quoted HTML attribute value. */
  public static final byte HTML_LITERAL_QUOTE = Token.INTERNAL_FIRST + 1;
  /** State: inside an unquoted HTML attribute value. */
  public static final byte HTML_LITERAL_NO_QUOTE = Token.INTERNAL_FIRST + 2;
  /** State: inside a tag, after the tag name, between attributes. */
  public static final byte INSIDE_TAG = Token.INTERNAL_FIRST + 3;

  // States used inside JSP scripting elements. Subtracting JSP_OFFSET from
  // one of these yields the standard token id that is emitted for it.
  public static final byte JSP_NULL     = Token.NULL     + JSP_OFFSET;
  public static final byte JSP_KEYWORD1 = Token.KEYWORD1 + JSP_OFFSET;
  public static final byte JSP_KEYWORD2 = Token.KEYWORD2 + JSP_OFFSET;
  public static final byte JSP_KEYWORD3 = Token.KEYWORD3 + JSP_OFFSET;
  public static final byte JSP_COMMENT1 = Token.COMMENT1 + JSP_OFFSET;
  public static final byte JSP_COMMENT2 = Token.COMMENT2 + JSP_OFFSET;
  public static final byte JSP_METHOD   = Token.METHOD   + JSP_OFFSET;
  public static final byte JSP_LITERAL1 = Token.LITERAL1 + JSP_OFFSET;
  public static final byte JSP_LITERAL2 = Token.LITERAL2 + JSP_OFFSET;
  public static final byte JSP_LABEL    = Token.LABEL    + JSP_OFFSET;

  /**
   * Creates a JSP token marker with JavaScript recognition enabled, using
   * the keyword maps of {@code JavaScriptTokenMarker} and
   * {@code JavaTokenMarker}.
   */
  public JSPTokenMarker()
  {
    this.js = true;
    keywords = JavaScriptTokenMarker.getKeywords();
    javaKeywords = JavaTokenMarker.getKeywords();
  }

  /**
   * Splits one line into tokens, reporting each through {@code addToken}.
   *
   * @param token the state to start the line in (presumably the value
   *        returned for the previous line; verify against the caller)
   * @param line the text of the line; only the range
   *        {@code [line.offset, line.offset + line.count)} is examined
   * @param lineIndex not used by this implementation
   * @return the state the marker is in at the end of the line
   * @throws InternalError if {@code token} is not a state this marker knows
   */
  public byte markTokensImpl(byte token, Segment line, int lineIndex)
  {
    char[] array = line.array;
    int offset = line.offset;
    lastOffset = offset;
    lastKeyword = offset;
    int length = line.count + offset; // exclusive end index of the line
    boolean backslash = false;
    lastWhitespace = offset - 1;

    loop:
    for (int i = offset; i < length; i++)
    {
      int i1 = (i + 1);

      char c = array[i];
      if (c == '\\')
      {
        backslash = !backslash;
        // In code and string states the backslash only arms the escape flag;
        // the following character decides what happens. JavaScript string
        // states are included so that \" and \' do not end the literal.
        if (token == JAVASCRIPT || token == Token.LITERAL1
            || token == Token.LITERAL2 || token >= JSP_NULL)
          continue;
      }

      switch (token)
      {
        case Token.NULL: // HTML text
          backslash = false;
          switch (c)
          {
            case '\\':
              addToken(i - lastOffset, token);
              lastOffset = lastKeyword = i;
              token = Token.OPERATOR;
              break;
            case '<':
              addToken(i - lastOffset, token);
              lastOffset = lastKeyword = i;
              if (SyntaxUtilities.regionMatches(false, line, i1, "!--"))
              {
                // Skip the rest of "<!--"; the comment token starts at '<'.
                i += 3;
                token = Token.COMMENT1;
              } else if (js && SyntaxUtilities.regionMatches(true, line, i1, "script")) {
                addToken(1, Token.KEYWORD1);
                lastOffset = lastKeyword = i1;
                lastWhitespace = i;
                // Tokenize the tag like any other; the flag switches to
                // JAVASCRIPT once the closing '>' is reached.
                token = Token.METHOD;
                javascript = true;
              } else if (SyntaxUtilities.regionMatches(true, line, i1, "%@")) {
                addToken(2, Token.OPERATOR);
                addToken(1, Token.LABEL);
                // Leave i on the last delimiter character so that the loop
                // increment lands on the first character after "<%@".
                lastOffset = lastKeyword = i + 3;
                lastWhitespace = i + 2;
                i += 2;
                token = JSP_LABEL;
              } else if (SyntaxUtilities.regionMatches(true, line, i1, "%=")) {
                addToken(3, Token.OPERATOR);
                lastOffset = lastKeyword = i + 3;
                lastWhitespace = i + 2;
                i += 2;
                token = JSP_NULL;
              } else if (SyntaxUtilities.regionMatches(true, line, i1, "%!")) {
                addToken(3, Token.OPERATOR);
                lastOffset = lastKeyword = i + 3;
                lastWhitespace = i + 2;
                i += 2;
                token = JSP_NULL;
              } else if (SyntaxUtilities.regionMatches(true, line, i1, "%")) {
                addToken(2, Token.OPERATOR);
                lastOffset = lastKeyword = i + 2;
                lastWhitespace = i1;
                i = i1;
                token = JSP_NULL;
              } else {
                addToken(1, Token.KEYWORD1);
                lastOffset = lastKeyword = i1;
                token = Token.METHOD;
              }
              break;
            case '&':
              addToken(i - lastOffset, token);
              lastOffset = lastKeyword = i;
              token = Token.KEYWORD2;
              break;
          }
          break;
        case Token.OPERATOR: // After a backslash in HTML text
          backslash = false;
          if (c != '<')
          {
            addToken(i1 - lastOffset, token);
            lastOffset = lastKeyword = i1;
            token = Token.NULL;
          }
          break;
        case Token.METHOD: // Inside a tag name
          backslash = false;
          if (c == '>')
          {
            addToken(i - lastOffset, token);
            addToken(1, Token.KEYWORD1);
            lastOffset = lastKeyword = i1;
            token = leaveTag(i);
          } else if (c == ':') {
            addToken(i1 - lastOffset, Token.LITERAL2);
            lastOffset = lastKeyword = i1;
          } else if (c == ' ' || c == '\t') {
            addToken(i1 - lastOffset, token);
            lastOffset = lastKeyword = i1;
            token = INSIDE_TAG;
          }
          break;
        case INSIDE_TAG:
          backslash = false;
          if (c == '>')
          {
            addToken(i - lastOffset, Token.METHOD);
            addToken(1, Token.KEYWORD1);
            lastOffset = lastKeyword = i1;
            token = leaveTag(i);
          } else if (c == '/' || c == '?') {
            addToken(1, Token.METHOD);
            lastOffset = lastKeyword = i1;
            token = Token.METHOD;
          } else {
            // Any other character starts an attribute name.
            addToken(i - lastOffset, Token.NULL);
            lastOffset = lastKeyword = i;
            token = Token.KEYWORD3;
          }
          break;
        case Token.KEYWORD2: // Inside an entity
          backslash = false;
          if (c == ';')
          {
            addToken(i1 - lastOffset, token);
            lastOffset = lastKeyword = i1;
            token = Token.NULL;
          }
          break;
        case Token.KEYWORD3: // Inside an attribute name
          backslash = false;
          if (c == '/' || c == '?')
          {
            addToken(i - lastOffset, token);
            addToken(1, Token.METHOD);
            lastOffset = lastKeyword = i1;
          } else if (c == '=') {
            addToken(i - lastOffset, token);
            addToken(1, Token.LABEL);
            lastOffset = lastKeyword = i1;
            // Look ahead for an opening quote, but never beyond the end of
            // this line: the backing array may hold more than the line.
            if (i1 < length && array[i1] == '"')
            {
              token = HTML_LITERAL_QUOTE;
              i++;
            } else {
              token = HTML_LITERAL_NO_QUOTE;
            }
          } else if (c == '>') {
            addToken(i - lastOffset, token);
            addToken(1, Token.KEYWORD1);
            lastOffset = lastKeyword = i1;
            // Honour a pending script tag here too (e.g. "<script defer>").
            token = leaveTag(i);
          } else if (c == ' ' || c == '\t') {
            addToken(i1 - lastOffset, token);
            lastOffset = lastKeyword = i1;
            token = INSIDE_TAG;
          }
          break;
        case HTML_LITERAL_QUOTE:
          backslash = false;
          if (c == '"')
          {
            addToken(i1 - lastOffset, Token.LITERAL1);
            lastOffset = lastKeyword = i1;
            token = INSIDE_TAG;
          }
          break;
        case HTML_LITERAL_NO_QUOTE:
          backslash = false;
          if (c == ' ' || c == '\t')
          {
            addToken(i1 - lastOffset, Token.LITERAL1);
            lastOffset = lastKeyword = i1;
            token = INSIDE_TAG;
          } else if (c == '>') {
            addToken(i - lastOffset, Token.LITERAL1);
            addToken(1, Token.KEYWORD1);
            lastOffset = lastKeyword = i1;
            // Honour a pending script tag here too (e.g. "<script src=x.js>").
            token = leaveTag(i);
          }
          break;
        case Token.COMMENT1: // Inside an HTML comment
          backslash = false;
          if (SyntaxUtilities.regionMatches(false, line, i, "-->"))
          {
            addToken((i + 3) - lastOffset, token);
            lastOffset = lastKeyword = i + 3;
            token = Token.NULL;
          }
          break;
        case JAVASCRIPT: // Inside JavaScript code
          switch (c)
          {
            case '<':
              backslash = false;
              doJSKeyword(line, i, c);
              if (SyntaxUtilities.regionMatches(true, line, i1, "/script>"))
              {
                addToken(i - lastOffset, Token.NULL);
                addToken(1, Token.KEYWORD1);
                addToken(7, Token.METHOD);
                addToken(1, Token.KEYWORD1);
                // The closing tag is 9 characters long. Leave i on its '>'
                // so the loop increment lands on the character after it.
                lastOffset = lastKeyword = i + 9;
                i += 8;
                token = Token.NULL;
              }
              break;
            case '(':
              if (backslash)
              {
                doJSKeyword(line, i, c);
                backslash = false;
              } else {
                if (doJSKeyword(line, i, c))
                  break;
                // The word between the last delimiter and '(' is a method name.
                addToken(lastWhitespace - lastOffset + 1, Token.NULL);
                addToken(i - lastWhitespace - 1, Token.METHOD);
                addToken(1, Token.NULL);
                token = JAVASCRIPT;
                lastOffset = lastKeyword = i1;
                lastWhitespace = i;
              }
              break;
            case '"':
              if (backslash)
                backslash = false;
              else
              {
                doJSKeyword(line, i, c);
                addToken(i - lastOffset, Token.NULL);
                lastOffset = lastKeyword = i;
                token = Token.LITERAL1;
              }
              break;
            case '\'':
              if (backslash)
                backslash = false;
              else
              {
                doJSKeyword(line, i, c);
                addToken(i - lastOffset, Token.NULL);
                lastOffset = lastKeyword = i;
                token = Token.LITERAL2;
              }
              break;
            case '/':
              backslash = false;
              doJSKeyword(line, i, c);
              if (length - i > 1)
              {
                // NOTE(review): for a plain division this rewinds lastKeyword
                // onto the '/' itself; confirm that is intended.
                addToken(i - lastOffset, Token.NULL);
                lastOffset = lastKeyword = i;
                if (array[i1] == '/')
                {
                  // Line comment: the rest of the line is one token.
                  addToken(length - i, Token.COMMENT2);
                  lastOffset = lastKeyword = length;
                  break loop;
                } else if (array[i1] == '*') {
                  token = Token.COMMENT2;
                }
              }
              break;
            default:
              backslash = false;
              if (!Character.isLetterOrDigit(c) && c != '_')
                doJSKeyword(line, i, c);
              if (CTokenMarker.METHOD_DELIMITERS.indexOf(c) != -1)
              {
                lastWhitespace = i;
              }
              break;
          }
          break;
        case Token.LITERAL1: // JavaScript "..."
          if (backslash)
            backslash = false;
          else if (c == '"')
          {
            addToken(i1 - lastOffset, Token.LITERAL1);
            lastOffset = lastKeyword = i1;
            lastWhitespace = i;
            token = JAVASCRIPT;
          }
          break;
        case Token.LITERAL2: // JavaScript '...'
          if (backslash)
            backslash = false;
          else if (c == '\'')
          {
            // NOTE(review): emitted as LITERAL1, the same id used for
            // double-quoted strings; confirm that is intended.
            addToken(i1 - lastOffset, Token.LITERAL1);
            lastOffset = lastKeyword = i1;
            lastWhitespace = i;
            token = JAVASCRIPT;
          }
          break;
        case Token.COMMENT2: // Inside a JavaScript block comment
          backslash = false;
          if (c == '*' && length - i > 1 && array[i1] == '/')
          {
            // Step onto the closing '/'; the loop increment moves past it.
            i++;
            addToken((i + 1) - lastOffset, Token.COMMENT1);
            lastOffset = lastKeyword = i + 1;
            lastWhitespace = i;
            token = JAVASCRIPT;
          }
          break;
        default:
          if (token >= JSP_OFFSET)
          {
            switch (token)
            {
              case JSP_NULL: // Java code inside a JSP scripting element
                switch(c)
                {
                case '%':
                  backslash = false;
                  if (length - i > 1 && array[i1] == '>')
                  {
                    // "%>" closes the scripting element.
                    addToken(i - lastOffset, jspDisplayId(token));
                    addToken(2, Token.OPERATOR);
                    lastOffset = lastKeyword = (i += 1) + 1;
                    token = Token.NULL;
                  } else {
                    // A lone '%' is an ordinary operator character.
                    addToken(i - lastOffset, jspDisplayId(token));
                    addToken(1, Token.NULL);
                    lastOffset = lastKeyword = i1;
                    lastWhitespace = i;
                    token = JSP_NULL;
                  }
                  break;
                case '(':
                  if (backslash)
                  {
                    doJavaKeyword(line, i, c);
                    backslash = false;
                  } else {
                    if (doJavaKeyword(line, i, c))
                      break;
                    // The word between the last delimiter and '(' is a method name.
                    addToken(lastWhitespace - lastOffset + 1, jspDisplayId(token));
                    addToken(i - lastWhitespace - 1, Token.METHOD);
                    addToken(1, Token.NULL);
                    token = JSP_NULL;
                    lastOffset = lastKeyword = i1;
                    lastWhitespace = i;
                  }
                  break;
                case '"':
                  doJavaKeyword(line, i, c);
                  if(backslash)
                    backslash = false;
                  else
                  {
                    addToken(i - lastOffset, jspDisplayId(token));
                    token = JSP_LITERAL1;
                    lastOffset = lastKeyword = i;
                  }
                  break;
                case '\'':
                  doJavaKeyword(line, i, c);
                  if (backslash)
                    backslash = false;
                  else
                  {
                    addToken(i - lastOffset, jspDisplayId(token));
                    token = JSP_LITERAL2;
                    lastOffset = lastKeyword = i;
                  }
                  break;
                case ':':
                  if(lastKeyword == offset)
                  {
                    // First word of the line followed by ':' is a label,
                    // unless it turns out to be a keyword.
                    if (doJavaKeyword(line, i, c))
                      break;
                    backslash = false;
                    addToken(i1 - lastOffset, Token.LABEL);
                    lastOffset = lastKeyword = i1;
                  }
                  else
                    doJavaKeyword(line, i, c);
                  break;
                case '/':
                  backslash = false;
                  doJavaKeyword(line, i, c);
                  if(length - i > 1)
                  {
                    switch(array[i1])
                    {
                      case '*':
                        addToken(i - lastOffset, jspDisplayId(token));
                        lastOffset = lastKeyword = i;
                        // A second '*' selects the alternate comment state.
                        if(length - i > 2 && array[i + 2] == '*')
                          token = JSP_COMMENT2;
                        else
                          token = JSP_COMMENT1;
                        break;
                      case '/':
                        // Line comment: the rest of the line is one token.
                        addToken(i - lastOffset, jspDisplayId(token));
                        addToken(length - i, Token.COMMENT1);
                        lastOffset = lastKeyword = length;
                        break loop;
                    }
                  }
                  break;
                default:
                  backslash = false;
                  if (!Character.isLetterOrDigit(c) && c != '_')
                    doJavaKeyword(line, i, c);
                  if (CTokenMarker.METHOD_DELIMITERS.indexOf(c) != -1)
                    lastWhitespace = i;
                  break;
                }
                break;
              case JSP_COMMENT1:
              case JSP_COMMENT2:
                backslash = false;
                if (c == '*' && length - i > 1)
                {
                  if (array[i1] == '/')
                  {
                    i++;
                    addToken((i + 1) - lastOffset, jspDisplayId(token));
                    token = JSP_NULL;
                    lastOffset = lastKeyword = i + 1;
                    lastWhitespace = i;
                  }
                }
                break;
              case JSP_LABEL: // Inside a directive opened by "<%@"
                backslash = false;
                if (c == ' ' || c == '\t')
                {
                  addToken(i1 - lastOffset, jspDisplayId(token));
                  lastOffset = lastKeyword = i1;
                } else if (c == '=') {
                  addToken(i - lastOffset, Token.KEYWORD3);
                  addToken(1, Token.LABEL);
                  lastOffset = lastKeyword = i1;
                } else if (c == '\'') {
                  addToken(i - lastOffset, Token.KEYWORD3);
                  token = JSP_LITERAL2;
                  lastOffset = lastKeyword = i;
                } else if (c == '"') {
                  addToken(i - lastOffset, Token.KEYWORD3);
                  token = JSP_LITERAL1;
                  lastOffset = lastKeyword = i;
                }
                break;
              case JSP_LITERAL1:
                if (backslash)
                  backslash = false;
                else if (c == '"')
                {
                  addToken(i1 - lastOffset, jspDisplayId(token));
                  token = JSP_NULL;
                  lastOffset = lastKeyword = i1;
                  lastWhitespace = i;
                }
                break;
              case JSP_LITERAL2:
                if (backslash)
                  backslash = false;
                else if (c == '\'')
                {
                  addToken(i1 - lastOffset, jspDisplayId(token));
                  token = JSP_NULL;
                  lastOffset = lastKeyword = i1;
                  lastWhitespace = i;
                }
                break;
              default:
                throw new InternalError("Invalid state: " + token);
            }
          } else
            throw new InternalError("Invalid state: " + token);
      }
    }

    // End of line: flush whatever is pending and pick the state to carry
    // over to the next line.
    switch (token)
    {
      case Token.LITERAL1:
      case Token.LITERAL2:
        // Unterminated JavaScript string.
        addToken(length - lastOffset, Token.INVALID);
        token = JAVASCRIPT;
        break;
      case Token.KEYWORD2:
        // Unterminated entity.
        addToken(length - lastOffset, Token.INVALID);
        token = Token.NULL;
        break;
      case JAVASCRIPT:
        doJSKeyword(line, length, '\0');
        addToken(length - lastOffset, Token.NULL);
        break;
      case Token.COMMENT2:
        addToken(length - lastOffset, Token.COMMENT1);
        break;
      case INSIDE_TAG:
        break;
      case HTML_LITERAL_QUOTE: case HTML_LITERAL_NO_QUOTE:
        addToken(length - lastOffset, Token.LITERAL1);
        break;
      default:
        if (token < JSP_NULL)
          addToken(length - lastOffset, token);
        else
        {
          if (token == JSP_NULL)
            doJavaKeyword(line, length, '\0');

          switch(token)
          {
            case JSP_LITERAL1:
            case JSP_LITERAL2:
              // Unterminated Java string or character literal.
              addToken(length - lastOffset, Token.INVALID);
              token = JSP_NULL;
              break;
            case JSP_KEYWORD2:
              addToken(length - lastOffset, jspDisplayId(token));
              if (!backslash)
                token = JSP_NULL;
              break;
            default:
              addToken(length - lastOffset, jspDisplayId(token));
              break;
          }
        }
        break;
    }

    return token;
  }

  // private members
  private KeywordMap keywords;      // JavaScript keywords
  private KeywordMap javaKeywords;  // Java keywords, used inside JSP scripting elements
  private boolean js;               // whether script tags switch to JavaScript mode
  private boolean javascript;       // a script tag is open and its '>' has not been seen yet
  private int lastOffset;           // start of the text not yet emitted as a token
  private int lastKeyword;          // start of the current keyword candidate
  private int lastWhitespace;       // index of the last method-name delimiter seen

  /**
   * Maps a {@code JSP_*} state back to the standard token id emitted for it.
   */
  private static byte jspDisplayId(byte state)
  {
    return (byte) (state - JSP_OFFSET);
  }

  /**
   * Returns the state that follows the '>' closing a tag. A pending script
   * tag switches to {@link #JAVASCRIPT} and clears the flag; any other tag
   * returns to HTML text.
   *
   * @param gt index of the '>' character; when entering JavaScript it is
   *        recorded as the last delimiter so that a method name directly
   *        after the tag is measured from the right place
   */
  private byte leaveTag(int gt)
  {
    if (!javascript)
      return Token.NULL;
    javascript = false;
    lastWhitespace = gt;
    return JAVASCRIPT;
  }

  /** Keyword check against the JavaScript keyword map; see {@link #doKeyword}. */
  private boolean doJSKeyword(Segment line, int i, char c)
  {
    return doKeyword(line, i, c, true);
  }

  /** Keyword check against the Java keyword map; see {@link #doKeyword}. */
  private boolean doJavaKeyword(Segment line, int i, char c)
  {
    return doKeyword(line, i, c, false);
  }

  /**
   * Looks up the text between {@code lastKeyword} and {@code i} in the
   * selected keyword map. On a match, any pending text before the keyword is
   * emitted as {@code Token.NULL}, followed by the keyword itself. In both
   * cases the next keyword candidate starts at {@code i + 1}.
   *
   * @param line the line being tokenized
   * @param i index of the delimiter that ends the candidate word
   * @param c the delimiter character (not used by the lookup)
   * @param javaScript {@code true} for the JavaScript keyword map,
   *        {@code false} for the Java one
   * @return {@code true} if a keyword token was emitted
   */
  private boolean doKeyword(Segment line, int i, char c, boolean javaScript)
  {
    int i1 = i + 1;

    int len = i - lastKeyword;
    byte id = (javaScript ? keywords : javaKeywords).lookup(line, lastKeyword, len);
    if (id != Token.NULL)
    {
      if (lastKeyword != lastOffset)
        addToken(lastKeyword - lastOffset, Token.NULL);
      addToken(len, id);
      lastKeyword = i1;
      lastOffset = i;
      lastWhitespace = i;
      return true;
    }
    lastKeyword = i1;
    return false;
  }
}
... this post is sponsored by my books ...

#1 New Release!

FP Best Seller

 

new blog posts

 

Copyright 1998-2021 Alvin Alexander, alvinalexander.com
All Rights Reserved.

A percentage of advertising revenue from
pages under the /java/jwarehouse URI on this website is
paid back to open source projects.