blob: 16ca12608f4574de9abc68c6423befb11ecf04e2 [file] [log] [blame]
package org.apache.harmony.regex.tests.java.util.regex;
import junit.framework.TestCase;
import java.util.regex.*;
/**
* TODO Type description
*
*/
public class SplitTest extends TestCase {
public void testSimple() {
Pattern p = Pattern.compile("/");
String[] results = p.split("have/you/done/it/right");
String[] expected = new String[] { "have", "you", "done", "it", "right" };
assertArraysEqual(expected, results);
}
public void testEmptySplits() {
// Trailing empty matches are removed.
assertArraysEqual(new String[0], "hello".split("."));
assertArraysEqual(new String[] { "1", "2" }, "1:2:".split(":"));
// ...including when that results in an empty result.
assertArraysEqual(new String[0], ":".split(":"));
// ...but not when limit < 0.
assertArraysEqual(new String[] { "1", "2", "" }, "1:2:".split(":", -1));
// Leading empty matches are retained.
assertArraysEqual(new String[] { "", "", "o" }, "hello".split(".."));
// A separator that doesn't occur in the input gets you the input.
assertArraysEqual(new String[] { "hello" }, "hello".split("not-present-in-test"));
// ...including when the input is the empty string.
// (Perl returns an empty list instead.)
assertArraysEqual(new String[] { "" }, "".split("not-present-in-test"));
assertArraysEqual(new String[] { "" }, "".split("A?"));
// The limit argument controls the size of the result.
// If l == 0, the result is as long as needed, except trailing empty matches are dropped.
// If l < 0, the result is as long as needed, and trailing empty matches are retained.
// If l > 0, the result contains the first l matches, plus one string containing the remaining input.
// Examples without a trailing separator (and hence without a trailing empty match):
assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c".split(",", 0));
assertArraysEqual(new String[] { "a,b,c" }, "a,b,c".split(",", 1));
assertArraysEqual(new String[] { "a", "b,c" }, "a,b,c".split(",", 2));
assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c".split(",", 3));
assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c".split(",", Integer.MAX_VALUE));
// Examples with a trailing separator (and hence possibly with a trailing empty match):
assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c,".split(",", 0));
assertArraysEqual(new String[] { "a,b,c," }, "a,b,c,".split(",", 1));
assertArraysEqual(new String[] { "a", "b,c," }, "a,b,c,".split(",", 2));
assertArraysEqual(new String[] { "a", "b", "c," }, "a,b,c,".split(",", 3));
assertArraysEqual(new String[] { "a", "b", "c", "" }, "a,b,c,".split(",", Integer.MAX_VALUE));
assertArraysEqual(new String[] { "a", "b", "c", "" }, "a,b,c,".split(",", -1));
}
private void assertArraysEqual(String[] expected, String[] actual) {
assertEquals(expected.length, actual.length);
for (int i = 0; i < expected.length; i++) {
assertEquals(Integer.toString(i), expected[i], actual[i]);
}
}
public void testSplit1() throws PatternSyntaxException {
Pattern p = Pattern.compile(" ");
String input = "poodle zoo";
String tokens[];
tokens = p.split(input, 1);
assertEquals(1, tokens.length);
assertTrue(tokens[0].equals(input));
tokens = p.split(input, 2);
assertEquals(2, tokens.length);
assertEquals("poodle", tokens[0]);
assertEquals("zoo", tokens[1]);
tokens = p.split(input, 5);
assertEquals(2, tokens.length);
assertEquals("poodle", tokens[0]);
assertEquals("zoo", tokens[1]);
tokens = p.split(input, -2);
assertEquals(2, tokens.length);
assertEquals("poodle", tokens[0]);
assertEquals("zoo", tokens[1]);
tokens = p.split(input, 0);
assertEquals(2, tokens.length);
assertEquals("poodle", tokens[0]);
assertEquals("zoo", tokens[1]);
tokens = p.split(input);
assertEquals(2, tokens.length);
assertEquals("poodle", tokens[0]);
assertEquals("zoo", tokens[1]);
p = Pattern.compile("d");
tokens = p.split(input, 1);
assertEquals(1, tokens.length);
assertTrue(tokens[0].equals(input));
tokens = p.split(input, 2);
assertEquals(2, tokens.length);
assertEquals("poo", tokens[0]);
assertEquals("le zoo", tokens[1]);
tokens = p.split(input, 5);
assertEquals(2, tokens.length);
assertEquals("poo", tokens[0]);
assertEquals("le zoo", tokens[1]);
tokens = p.split(input, -2);
assertEquals(2, tokens.length);
assertEquals("poo", tokens[0]);
assertEquals("le zoo", tokens[1]);
tokens = p.split(input, 0);
assertEquals(2, tokens.length);
assertEquals("poo", tokens[0]);
assertEquals("le zoo", tokens[1]);
tokens = p.split(input);
assertEquals(2, tokens.length);
assertEquals("poo", tokens[0]);
assertEquals("le zoo", tokens[1]);
p = Pattern.compile("o");
tokens = p.split(input, 1);
assertEquals(1, tokens.length);
assertTrue(tokens[0].equals(input));
tokens = p.split(input, 2);
assertEquals(2, tokens.length);
assertEquals("p", tokens[0]);
assertEquals("odle zoo", tokens[1]);
tokens = p.split(input, 5);
assertEquals(5, tokens.length);
assertEquals("p", tokens[0]);
assertTrue(tokens[1].equals(""));
assertEquals("dle z", tokens[2]);
assertTrue(tokens[3].equals(""));
assertTrue(tokens[4].equals(""));
tokens = p.split(input, -2);
assertEquals(5, tokens.length);
assertEquals("p", tokens[0]);
assertTrue(tokens[1].equals(""));
assertEquals("dle z", tokens[2]);
assertTrue(tokens[3].equals(""));
assertTrue(tokens[4].equals(""));
tokens = p.split(input, 0);
assertEquals(3, tokens.length);
assertEquals("p", tokens[0]);
assertTrue(tokens[1].equals(""));
assertEquals("dle z", tokens[2]);
tokens = p.split(input);
assertEquals(3, tokens.length);
assertEquals("p", tokens[0]);
assertTrue(tokens[1].equals(""));
assertEquals("dle z", tokens[2]);
}
public void testSplit2() {
Pattern p = Pattern.compile("");
String s[];
s = p.split("a", -1);
assertEquals(3, s.length);
assertEquals("", s[0]);
assertEquals("a", s[1]);
assertEquals("", s[2]);
s = p.split("", -1);
assertEquals(1, s.length);
assertEquals("", s[0]);
s = p.split("abcd", -1);
assertEquals(6, s.length);
assertEquals("", s[0]);
assertEquals("a", s[1]);
assertEquals("b", s[2]);
assertEquals("c", s[3]);
assertEquals("d", s[4]);
assertEquals("", s[5]);
// Regression test for Android
assertEquals("GOOG,23,500".split("|").length, 12);
}
public void testSplitSupplementaryWithEmptyString() {
/*
* See http://www.unicode.org/reports/tr18/#Supplementary_Characters
* We have to treat text as code points not code units.
*/
Pattern p = Pattern.compile("");
String s[];
s = p.split("a\ud869\uded6b", -1);
assertEquals(5, s.length);
assertEquals("", s[0]);
assertEquals("a", s[1]);
assertEquals("\ud869\uded6", s[2]);
assertEquals("b", s[3]);
assertEquals("", s[4]);
}
}