| /* |
| * Copyright 2000-2014 JetBrains s.r.o. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.jetbrains.plugins.groovy.findUsages; |
| |
| import com.intellij.lang.cacheBuilder.WordOccurrence; |
| import com.intellij.lang.cacheBuilder.WordsScanner; |
| import com.intellij.lexer.Lexer; |
| import com.intellij.psi.tree.IElementType; |
| import com.intellij.util.Processor; |
| import org.jetbrains.plugins.groovy.lang.lexer.GroovyLexer; |
| import org.jetbrains.plugins.groovy.lang.lexer.GroovyTokenTypes; |
| import org.jetbrains.plugins.groovy.lang.lexer.TokenSets; |
| |
| /** |
| * @author ven |
| */ |
| class GroovyWordsScanner implements WordsScanner |
| { |
| private final Lexer myLexer; |
| public GroovyWordsScanner() |
| { |
| myLexer = new GroovyLexer(); |
| } |
| |
| @Override |
| public void processWords(CharSequence fileText, Processor<WordOccurrence> processor) { |
| myLexer.start(fileText); |
| WordOccurrence occurrence = null; // shared occurrence |
| |
| while (myLexer.getTokenType() != null) { |
| final IElementType type = myLexer.getTokenType(); |
| if (type == GroovyTokenTypes.mIDENT || TokenSets.KEYWORDS.contains(type)) { |
| if (occurrence == null) occurrence = new WordOccurrence(fileText,myLexer.getTokenStart(),myLexer.getTokenEnd(), WordOccurrence.Kind.CODE); |
| else occurrence.init(fileText,myLexer.getTokenStart(),myLexer.getTokenEnd(), WordOccurrence.Kind.CODE); |
| if (!processor.process(occurrence)) return; |
| } |
| else if (TokenSets.COMMENT_SET.contains(type)) { |
| if (!stripWords(processor, fileText,myLexer.getTokenStart(),myLexer.getTokenEnd(), WordOccurrence.Kind.COMMENTS, occurrence)) return; |
| } |
| else if (TokenSets.STRING_LITERALS.contains(type)) { |
| if (!stripWords(processor, fileText, myLexer.getTokenStart(), myLexer.getTokenEnd(), WordOccurrence.Kind.LITERALS, occurrence)) { |
| return; |
| } |
| |
| if (type == GroovyTokenTypes.mSTRING_LITERAL) { |
| if (!stripWords(processor, fileText, myLexer.getTokenStart(),myLexer.getTokenEnd(),WordOccurrence.Kind.CODE, occurrence)) return; |
| } |
| } |
| |
| myLexer.advance(); |
| } |
| } |
| |
| private static boolean stripWords(final Processor<WordOccurrence> processor, |
| final CharSequence tokenText, |
| int from, |
| int to, |
| final WordOccurrence.Kind kind, |
| WordOccurrence occurrence) { |
| // This code seems strange but it is more effective as Character.isJavaIdentifier_xxx_ is quite costly operation due to unicode |
| int index = from; |
| |
| ScanWordsLoop: |
| while (true) { |
| while (true) { |
| if (index == to) break ScanWordsLoop; |
| char c = tokenText.charAt(index); |
| if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || (c >= '0' && c <= '9') || |
| (Character.isJavaIdentifierStart(c) && c != '$')) { |
| break; |
| } |
| index++; |
| } |
| int index1 = index; |
| while (true) { |
| index++; |
| if (index == to) break; |
| char c = tokenText.charAt(index); |
| if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || (c >= '0' && c <= '9')) continue; |
| if (!Character.isJavaIdentifierPart(c) || c == '$') break; |
| } |
| |
| if (occurrence == null) occurrence = new WordOccurrence(tokenText,index1, index, kind); |
| else occurrence.init(tokenText,index1, index, kind); |
| if (!processor.process(occurrence)) return false; |
| } |
| return true; |
| } |
| } |