| /* |
| * Copyright 2000-2013 JetBrains s.r.o. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package com.intellij.spellchecker.inspections; |
| |
| import com.intellij.openapi.util.TextRange; |
| import com.intellij.openapi.util.text.StringUtil; |
| import com.intellij.util.Consumer; |
| import org.jetbrains.annotations.NotNull; |
| import org.jetbrains.annotations.Nullable; |
| |
| import java.util.regex.Matcher; |
| import java.util.regex.Pattern; |
| |
| public class TextSplitter extends BaseSplitter { |
| private static final TextSplitter INSTANCE = new TextSplitter(); |
| |
| public static TextSplitter getInstance() { |
| return INSTANCE; |
| } |
| |
| private static final Pattern EXTENDED_WORD_AND_SPECIAL = Pattern.compile("([&#]|0x[0-9]*)?\\p{L}+'?\\p{L}[_\\p{L}]*"); |
| |
| @Override |
| public void split(@Nullable String text, @NotNull TextRange range, Consumer<TextRange> consumer) { |
| if (text == null || StringUtil.isEmpty(text)) { |
| return; |
| } |
| doSplit(text, range, consumer); |
| } |
| |
| protected void doSplit(@NotNull String text, @NotNull TextRange range, Consumer<TextRange> consumer) { |
| final WordSplitter ws = WordSplitter.getInstance(); |
| Matcher matcher = EXTENDED_WORD_AND_SPECIAL.matcher(text); |
| matcher.region(range.getStartOffset(), range.getEndOffset()); |
| while (matcher.find()) { |
| TextRange found = new TextRange(matcher.start(), matcher.end()); |
| ws.split(text, found, consumer); |
| } |
| } |
| } |