| package org.apache.harmony.regex.tests.java.util.regex; |
| |
| import junit.framework.TestCase; |
| import java.util.regex.*; |
| |
| /** |
| * TODO Type description |
| * |
| */ |
| public class SplitTest extends TestCase { |
| public void testSimple() { |
| Pattern p = Pattern.compile("/"); |
| String[] results = p.split("have/you/done/it/right"); |
| String[] expected = new String[] { "have", "you", "done", "it", "right" }; |
| assertArraysEqual(expected, results); |
| } |
| |
| public void testEmptySplits() { |
| // Trailing empty matches are removed. |
| assertArraysEqual(new String[0], "hello".split(".")); |
| assertArraysEqual(new String[] { "1", "2" }, "1:2:".split(":")); |
| // ...including when that results in an empty result. |
| assertArraysEqual(new String[0], ":".split(":")); |
| // ...but not when limit < 0. |
| assertArraysEqual(new String[] { "1", "2", "" }, "1:2:".split(":", -1)); |
| |
| // Leading empty matches are retained. |
| assertArraysEqual(new String[] { "", "", "o" }, "hello".split("..")); |
| |
| // A separator that doesn't occur in the input gets you the input. |
| assertArraysEqual(new String[] { "hello" }, "hello".split("not-present-in-test")); |
| // ...including when the input is the empty string. |
| // (Perl returns an empty list instead.) |
| assertArraysEqual(new String[] { "" }, "".split("not-present-in-test")); |
| assertArraysEqual(new String[] { "" }, "".split("A?")); |
| |
| // The limit argument controls the size of the result. |
| // If l == 0, the result is as long as needed, except trailing empty matches are dropped. |
| // If l < 0, the result is as long as needed, and trailing empty matches are retained. |
| // If l > 0, the result contains the first l matches, plus one string containing the remaining input. |
| // Examples without a trailing separator (and hence without a trailing empty match): |
| assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c".split(",", 0)); |
| assertArraysEqual(new String[] { "a,b,c" }, "a,b,c".split(",", 1)); |
| assertArraysEqual(new String[] { "a", "b,c" }, "a,b,c".split(",", 2)); |
| assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c".split(",", 3)); |
| assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c".split(",", Integer.MAX_VALUE)); |
| // Examples with a trailing separator (and hence possibly with a trailing empty match): |
| assertArraysEqual(new String[] { "a", "b", "c" }, "a,b,c,".split(",", 0)); |
| assertArraysEqual(new String[] { "a,b,c," }, "a,b,c,".split(",", 1)); |
| assertArraysEqual(new String[] { "a", "b,c," }, "a,b,c,".split(",", 2)); |
| assertArraysEqual(new String[] { "a", "b", "c," }, "a,b,c,".split(",", 3)); |
| assertArraysEqual(new String[] { "a", "b", "c", "" }, "a,b,c,".split(",", Integer.MAX_VALUE)); |
| assertArraysEqual(new String[] { "a", "b", "c", "" }, "a,b,c,".split(",", -1)); |
| } |
| |
| private void assertArraysEqual(String[] expected, String[] actual) { |
| assertEquals(expected.length, actual.length); |
| for (int i = 0; i < expected.length; i++) { |
| assertEquals(Integer.toString(i), expected[i], actual[i]); |
| } |
| } |
| |
| public void testSplit1() throws PatternSyntaxException { |
| Pattern p = Pattern.compile(" "); |
| |
| String input = "poodle zoo"; |
| String tokens[]; |
| |
| tokens = p.split(input, 1); |
| assertEquals(1, tokens.length); |
| assertTrue(tokens[0].equals(input)); |
| tokens = p.split(input, 2); |
| assertEquals(2, tokens.length); |
| assertEquals("poodle", tokens[0]); |
| assertEquals("zoo", tokens[1]); |
| tokens = p.split(input, 5); |
| assertEquals(2, tokens.length); |
| assertEquals("poodle", tokens[0]); |
| assertEquals("zoo", tokens[1]); |
| tokens = p.split(input, -2); |
| assertEquals(2, tokens.length); |
| assertEquals("poodle", tokens[0]); |
| assertEquals("zoo", tokens[1]); |
| tokens = p.split(input, 0); |
| assertEquals(2, tokens.length); |
| assertEquals("poodle", tokens[0]); |
| assertEquals("zoo", tokens[1]); |
| tokens = p.split(input); |
| assertEquals(2, tokens.length); |
| assertEquals("poodle", tokens[0]); |
| assertEquals("zoo", tokens[1]); |
| |
| p = Pattern.compile("d"); |
| |
| tokens = p.split(input, 1); |
| assertEquals(1, tokens.length); |
| assertTrue(tokens[0].equals(input)); |
| tokens = p.split(input, 2); |
| assertEquals(2, tokens.length); |
| assertEquals("poo", tokens[0]); |
| assertEquals("le zoo", tokens[1]); |
| tokens = p.split(input, 5); |
| assertEquals(2, tokens.length); |
| assertEquals("poo", tokens[0]); |
| assertEquals("le zoo", tokens[1]); |
| tokens = p.split(input, -2); |
| assertEquals(2, tokens.length); |
| assertEquals("poo", tokens[0]); |
| assertEquals("le zoo", tokens[1]); |
| tokens = p.split(input, 0); |
| assertEquals(2, tokens.length); |
| assertEquals("poo", tokens[0]); |
| assertEquals("le zoo", tokens[1]); |
| tokens = p.split(input); |
| assertEquals(2, tokens.length); |
| assertEquals("poo", tokens[0]); |
| assertEquals("le zoo", tokens[1]); |
| |
| p = Pattern.compile("o"); |
| |
| tokens = p.split(input, 1); |
| assertEquals(1, tokens.length); |
| assertTrue(tokens[0].equals(input)); |
| tokens = p.split(input, 2); |
| assertEquals(2, tokens.length); |
| assertEquals("p", tokens[0]); |
| assertEquals("odle zoo", tokens[1]); |
| tokens = p.split(input, 5); |
| assertEquals(5, tokens.length); |
| assertEquals("p", tokens[0]); |
| assertTrue(tokens[1].equals("")); |
| assertEquals("dle z", tokens[2]); |
| assertTrue(tokens[3].equals("")); |
| assertTrue(tokens[4].equals("")); |
| tokens = p.split(input, -2); |
| assertEquals(5, tokens.length); |
| assertEquals("p", tokens[0]); |
| assertTrue(tokens[1].equals("")); |
| assertEquals("dle z", tokens[2]); |
| assertTrue(tokens[3].equals("")); |
| assertTrue(tokens[4].equals("")); |
| tokens = p.split(input, 0); |
| assertEquals(3, tokens.length); |
| assertEquals("p", tokens[0]); |
| assertTrue(tokens[1].equals("")); |
| assertEquals("dle z", tokens[2]); |
| tokens = p.split(input); |
| assertEquals(3, tokens.length); |
| assertEquals("p", tokens[0]); |
| assertTrue(tokens[1].equals("")); |
| assertEquals("dle z", tokens[2]); |
| } |
| |
| public void testSplit2() { |
| Pattern p = Pattern.compile(""); |
| String s[]; |
| s = p.split("a", -1); |
| assertEquals(3, s.length); |
| assertEquals("", s[0]); |
| assertEquals("a", s[1]); |
| assertEquals("", s[2]); |
| |
| s = p.split("", -1); |
| assertEquals(1, s.length); |
| assertEquals("", s[0]); |
| |
| s = p.split("abcd", -1); |
| assertEquals(6, s.length); |
| assertEquals("", s[0]); |
| assertEquals("a", s[1]); |
| assertEquals("b", s[2]); |
| assertEquals("c", s[3]); |
| assertEquals("d", s[4]); |
| assertEquals("", s[5]); |
| |
| // Regression test for Android |
| assertEquals("GOOG,23,500".split("|").length, 12); |
| } |
| |
| |
| public void testSplitSupplementaryWithEmptyString() { |
| |
| /* |
| * See http://www.unicode.org/reports/tr18/#Supplementary_Characters |
| * We have to treat text as code points not code units. |
| */ |
| Pattern p = Pattern.compile(""); |
| String s[]; |
| s = p.split("a\ud869\uded6b", -1); |
| assertEquals(5, s.length); |
| assertEquals("", s[0]); |
| assertEquals("a", s[1]); |
| assertEquals("\ud869\uded6", s[2]); |
| assertEquals("b", s[3]); |
| assertEquals("", s[4]); |
| } |
| } |