| /* |
| * Copyright 2000-2011 JetBrains s.r.o. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package com.intellij.openapi.util.text; |
| |
| import com.intellij.util.ArrayUtil; |
| import com.intellij.util.text.CharArrayCharSequence; |
| |
| import java.util.ArrayList; |
| import java.util.Collections; |
| import java.util.List; |
| |
| public class LineTokenizer { |
| private int myOffset = 0; |
| private int myLength = 0; |
| private int myLineSeparatorLength = 0; |
| private boolean atEnd = false; |
| private CharSequence myText; |
| |
| public static String[] tokenize(CharSequence chars, boolean includeSeparators) { |
| return tokenize(chars, includeSeparators, true); |
| } |
| |
| private static String[] tokenize(final CharSequence chars, final boolean includeSeparators, final boolean skipLastEmptyLine) { |
| final List<String> strings = tokenizeIntoList(chars, includeSeparators, skipLastEmptyLine); |
| return strings.isEmpty() ? ArrayUtil.EMPTY_STRING_ARRAY : ArrayUtil.toStringArray(strings); |
| } |
| |
| public static List<String> tokenizeIntoList(final CharSequence chars, final boolean includeSeparators) { |
| return tokenizeIntoList(chars, includeSeparators, true); |
| } |
| |
| public static List<String> tokenizeIntoList(final CharSequence chars, final boolean includeSeparators, final boolean skipLastEmptyLine) { |
| if (chars == null || chars.length() == 0){ |
| return Collections.emptyList(); |
| } |
| |
| LineTokenizer tokenizer = new LineTokenizer(chars); |
| List<String> lines = new ArrayList<String>(); |
| while(!tokenizer.atEnd()){ |
| int offset = tokenizer.getOffset(); |
| String line; |
| if (includeSeparators){ |
| line = chars.subSequence(offset, offset + tokenizer.getLength() + tokenizer.getLineSeparatorLength()).toString(); |
| } |
| else{ |
| line = chars.subSequence(offset, offset + tokenizer.getLength()).toString(); |
| } |
| lines.add(line); |
| tokenizer.advance(); |
| } |
| |
| if (!skipLastEmptyLine && stringEndsWithSeparator(tokenizer)) lines.add(""); |
| |
| return lines; |
| } |
| |
| public static int calcLineCount(final CharSequence chars, final boolean skipLastEmptyLine) { |
| int lineCount = 0; |
| if (chars != null && chars.length() != 0) { |
| final LineTokenizer tokenizer = new LineTokenizer(chars); |
| while (!tokenizer.atEnd()) { |
| lineCount += 1; |
| tokenizer.advance(); |
| } |
| if (!skipLastEmptyLine && stringEndsWithSeparator(tokenizer)) { |
| lineCount += 1; |
| } |
| } |
| return lineCount; |
| } |
| |
| public static String[] tokenize(char[] chars, boolean includeSeparators) { |
| return tokenize(chars, includeSeparators, true); |
| } |
| |
| public static String[] tokenize(char[] chars, boolean includeSeparators, boolean skipLastEmptyLine) { |
| return tokenize(chars, 0, chars.length, includeSeparators, skipLastEmptyLine); |
| } |
| |
| public static String[] tokenize(char[] chars, int startOffset, int endOffset, boolean includeSeparators, |
| boolean skipLastEmptyLine) { |
| return tokenize(new CharArrayCharSequence(chars, startOffset, endOffset), includeSeparators, skipLastEmptyLine); |
| } |
| |
| private static boolean stringEndsWithSeparator(LineTokenizer tokenizer) { |
| return tokenizer.getLineSeparatorLength() > 0; |
| } |
| |
| public static String[] tokenize(char[] chars, int startOffset, int endOffset, boolean includeSeparators) { |
| return tokenize(chars, startOffset, endOffset, includeSeparators, true); |
| } |
| |
| public LineTokenizer(CharSequence text) { |
| myText = text; |
| myOffset = 0; |
| advance(); |
| } |
| |
| public LineTokenizer(char[] text, int startOffset, int endOffset) { |
| this(new CharArrayCharSequence(text, startOffset, endOffset)); |
| } |
| |
| public final boolean atEnd() { |
| return atEnd; |
| } |
| |
| public final int getOffset() { |
| return myOffset; |
| } |
| |
| public final int getLength() { |
| return myLength; |
| } |
| |
| public final int getLineSeparatorLength() { |
| return myLineSeparatorLength; |
| } |
| |
| public void advance() { |
| int i = myOffset + myLength + myLineSeparatorLength; |
| final int textLength = myText.length(); |
| if (i >= textLength){ |
| atEnd = true; |
| return; |
| } |
| while(i < textLength){ |
| char c = myText.charAt(i); |
| if (c == '\r' || c == '\n') break; |
| i++; |
| } |
| |
| myOffset = myOffset + myLength + myLineSeparatorLength; |
| myLength = i - myOffset; |
| |
| myLineSeparatorLength = 0; |
| if (i == textLength) return; |
| |
| char first = myText.charAt(i); |
| if (first == '\r' || first == '\n') { |
| myLineSeparatorLength = 1; |
| } |
| |
| i++; |
| if (i == textLength) return; |
| |
| char second = myText.charAt(i); |
| if (first == '\r' && second == '\n') { |
| myLineSeparatorLength = 2; |
| } |
| } |
| } |