/* * PythonTokenMarker.java - Python token marker * Copyright (C) 1999 Jonathan Revusky * Copyright (C) 1998, 1999 Slava Pestov * * You may use and modify this package for any purpose. Redistribution is * permitted, in both source and binary form, provided that this notice * remains intact in all source distributions of this package. */ import javax.swing.text.Segment; /** * Python token marker. * * @author Jonathan Revusky * @version $Id: PythonTokenMarker.java,v 1.3 1999/12/14 04:20:35 sp Exp $ */ public class PythonTokenMarker extends TokenMarker { private static final byte TRIPLEQUOTE1 = Token.INTERNAL_FIRST; private static final byte TRIPLEQUOTE2 = Token.INTERNAL_LAST; public PythonTokenMarker() { this.keywords = getKeywords(); } public byte markTokensImpl(byte token, Segment line, int lineIndex) { char[] array = line.array; int offset = line.offset; lastOffset = offset; lastKeyword = offset; int length = line.count + offset; boolean backslash = false; loop: for(int i = offset; i < length; i++) { int i1 = (i+1); char c = array[i]; if(c == '\\') { backslash = !backslash; continue; } switch(token) { case Token.NULL: switch(c) { case '#': if(backslash) backslash = false; else { doKeyword(line,i,c); addToken(i - lastOffset,token); addToken(length - i,Token.COMMENT1); lastOffset = lastKeyword = length; break loop; } break; case '"': doKeyword(line,i,c); if(backslash) backslash = false; else { addToken(i - lastOffset,token); if(SyntaxUtilities.regionMatches(false, line,i1,"\"\"")) { token = TRIPLEQUOTE1; } else { token = Token.LITERAL1; } lastOffset = lastKeyword = i; } break; case '\'': doKeyword(line,i,c); if(backslash) backslash = false; else { addToken(i - lastOffset,token); if(SyntaxUtilities.regionMatches(false, line,i1,"''")) { token = TRIPLEQUOTE2; } else { token = Token.LITERAL2; } lastOffset = lastKeyword = i; } break; default: backslash = false; if(!Character.isLetterOrDigit(c) && c != '_') doKeyword(line,i,c); break; } break; case Token.LITERAL1: if(backslash) backslash = false; else if(c == '"') { addToken(i1 - lastOffset,token); token = Token.NULL; lastOffset = lastKeyword = i1; } break; case Token.LITERAL2: if(backslash) backslash = false; else if(c == '\'') { addToken(i1 - lastOffset,Token.LITERAL1); token = Token.NULL; lastOffset = lastKeyword = i1; } break; case TRIPLEQUOTE1: if(backslash) backslash = false; else if(SyntaxUtilities.regionMatches(false, line,i,"\"\"\"")) { addToken((i+=4) - lastOffset, Token.LITERAL1); token = Token.NULL; lastOffset = lastKeyword = i; } break; case TRIPLEQUOTE2: if(backslash) backslash = false; else if(SyntaxUtilities.regionMatches(false, line,i,"'''")) { addToken((i+=4) - lastOffset, Token.LITERAL1); token = Token.NULL; lastOffset = lastKeyword = i; } break; default: throw new InternalError("Invalid state: " + token); } } switch(token) { case TRIPLEQUOTE1: case TRIPLEQUOTE2: addToken(length - lastOffset,Token.LITERAL1); break; case Token.NULL: doKeyword(line,length,'\0'); default: addToken(length - lastOffset,token); break; } return token; } public static KeywordMap getKeywords() { if (pyKeywords == null) { pyKeywords = new KeywordMap(false); pyKeywords.add("and",Token.KEYWORD3); pyKeywords.add("not",Token.KEYWORD3); pyKeywords.add("or",Token.KEYWORD3); pyKeywords.add("if",Token.KEYWORD1); pyKeywords.add("for",Token.KEYWORD1); pyKeywords.add("assert",Token.KEYWORD1); pyKeywords.add("break",Token.KEYWORD1); pyKeywords.add("continue",Token.KEYWORD1); pyKeywords.add("elif",Token.KEYWORD1); pyKeywords.add("else",Token.KEYWORD1); pyKeywords.add("except",Token.KEYWORD1); pyKeywords.add("exec",Token.KEYWORD1); pyKeywords.add("finally",Token.KEYWORD1); pyKeywords.add("raise",Token.KEYWORD1); pyKeywords.add("return",Token.KEYWORD1); pyKeywords.add("try",Token.KEYWORD1); pyKeywords.add("while",Token.KEYWORD1); pyKeywords.add("def",Token.KEYWORD2); pyKeywords.add("class",Token.KEYWORD2); pyKeywords.add("del",Token.KEYWORD2); pyKeywords.add("from",Token.KEYWORD2); pyKeywords.add("global",Token.KEYWORD2); pyKeywords.add("import",Token.KEYWORD2); pyKeywords.add("in",Token.KEYWORD2); pyKeywords.add("is",Token.KEYWORD2); pyKeywords.add("lambda",Token.KEYWORD2); pyKeywords.add("pass",Token.KEYWORD2); pyKeywords.add("print",Token.KEYWORD2); } return pyKeywords; } // private members private static KeywordMap pyKeywords; private KeywordMap keywords; private int lastOffset; private int lastKeyword; private boolean doKeyword(Segment line, int i, char c) { int i1 = i+1; int len = i - lastKeyword; byte id = keywords.lookup(line,lastKeyword,len); if(id != Token.NULL) { if(lastKeyword != lastOffset) addToken(lastKeyword - lastOffset,Token.NULL); addToken(len,id); lastOffset = i; } lastKeyword = i1; return false; } }