176f614720db6a282c3e890969a600585122cdcc5Marc Blank/*
276f614720db6a282c3e890969a600585122cdcc5Marc Blank * Copyright (C) 2010 The Android Open Source Project
376f614720db6a282c3e890969a600585122cdcc5Marc Blank *
476f614720db6a282c3e890969a600585122cdcc5Marc Blank * Licensed under the Apache License, Version 2.0 (the "License");
576f614720db6a282c3e890969a600585122cdcc5Marc Blank * you may not use this file except in compliance with the License.
676f614720db6a282c3e890969a600585122cdcc5Marc Blank * You may obtain a copy of the License at
776f614720db6a282c3e890969a600585122cdcc5Marc Blank *
876f614720db6a282c3e890969a600585122cdcc5Marc Blank *      http://www.apache.org/licenses/LICENSE-2.0
976f614720db6a282c3e890969a600585122cdcc5Marc Blank *
1076f614720db6a282c3e890969a600585122cdcc5Marc Blank * Unless required by applicable law or agreed to in writing, software
1176f614720db6a282c3e890969a600585122cdcc5Marc Blank * distributed under the License is distributed on an "AS IS" BASIS,
1276f614720db6a282c3e890969a600585122cdcc5Marc Blank * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
1376f614720db6a282c3e890969a600585122cdcc5Marc Blank * See the License for the specific language governing permissions and
1476f614720db6a282c3e890969a600585122cdcc5Marc Blank * limitations under the License.
1576f614720db6a282c3e890969a600585122cdcc5Marc Blank */
1676f614720db6a282c3e890969a600585122cdcc5Marc Blank
1776f614720db6a282c3e890969a600585122cdcc5Marc Blank/**
1876f614720db6a282c3e890969a600585122cdcc5Marc Blank * This is a series of unit tests for snippet creation and highlighting
1976f614720db6a282c3e890969a600585122cdcc5Marc Blank *
2076f614720db6a282c3e890969a600585122cdcc5Marc Blank * You can run this entire test case with:
2176f614720db6a282c3e890969a600585122cdcc5Marc Blank *   runtest -c com.android.emailcommon.utility.TextUtilitiesTests email
2276f614720db6a282c3e890969a600585122cdcc5Marc Blank */
2376f614720db6a282c3e890969a600585122cdcc5Marc Blankpackage com.android.emailcommon.utility;
2476f614720db6a282c3e890969a600585122cdcc5Marc Blank
2576f614720db6a282c3e890969a600585122cdcc5Marc Blankimport android.test.AndroidTestCase;
2676f614720db6a282c3e890969a600585122cdcc5Marc Blankimport android.text.SpannableStringBuilder;
2776f614720db6a282c3e890969a600585122cdcc5Marc Blankimport android.text.style.BackgroundColorSpan;
2876f614720db6a282c3e890969a600585122cdcc5Marc Blank
2976f614720db6a282c3e890969a600585122cdcc5Marc Blankpublic class TextUtilitiesTests extends AndroidTestCase {
3076f614720db6a282c3e890969a600585122cdcc5Marc Blank
3176f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testPlainSnippet() {
3276f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test the simplest cases
3376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("", TextUtilities.makeSnippetFromPlainText(null));
3476f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("", TextUtilities.makeSnippetFromPlainText(""));
3576f614720db6a282c3e890969a600585122cdcc5Marc Blank
3676f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test handling leading, trailing, and duplicated whitespace
3776f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Just test common whitespace characters; we calls Character.isWhitespace() internally, so
3876f614720db6a282c3e890969a600585122cdcc5Marc Blank        // other whitespace should be fine as well
3976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("", TextUtilities.makeSnippetFromPlainText(" \n\r\t\r\t\n"));
4076f614720db6a282c3e890969a600585122cdcc5Marc Blank        char c = TextUtilities.NON_BREAKING_SPACE_CHARACTER;
4176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("foo", TextUtilities.makeSnippetFromPlainText(c + "\r\n\tfoo \n\t\r" + c));
4276f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("foo bar",
4376f614720db6a282c3e890969a600585122cdcc5Marc Blank                TextUtilities.makeSnippetFromPlainText(c + "\r\n\tfoo \r\n bar\n\t\r" + c));
4476f614720db6a282c3e890969a600585122cdcc5Marc Blank
4576f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Handle duplicated - and =
4676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("Foo-Bar=Bletch",
4776f614720db6a282c3e890969a600585122cdcc5Marc Blank                TextUtilities.makeSnippetFromPlainText("Foo-----Bar=======Bletch"));
4876f614720db6a282c3e890969a600585122cdcc5Marc Blank
4976f614720db6a282c3e890969a600585122cdcc5Marc Blank        // We shouldn't muck with HTML entities
5076f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(" >", TextUtilities.makeSnippetFromPlainText(" >"));
5176f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
5276f614720db6a282c3e890969a600585122cdcc5Marc Blank
5376f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHtmlSnippet() {
5476f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test the simplest cases
5576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("", TextUtilities.makeSnippetFromHtmlText(null));
5676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("", TextUtilities.makeSnippetFromHtmlText(""));
5776f614720db6a282c3e890969a600585122cdcc5Marc Blank
5876f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test handling leading, trailing, and duplicated whitespace
5976f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Just test common whitespace characters; we calls Character.isWhitespace() internally, so
6076f614720db6a282c3e890969a600585122cdcc5Marc Blank        // other whitespace should be fine as well
6176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("", TextUtilities.makeSnippetFromHtmlText(" \n\r\t\r\t\n"));
6276f614720db6a282c3e890969a600585122cdcc5Marc Blank        char c = TextUtilities.NON_BREAKING_SPACE_CHARACTER;
6376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("foo", TextUtilities.makeSnippetFromHtmlText(c + "\r\n\tfoo \n\t\r" + c));
6476f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("foo bar",
6576f614720db6a282c3e890969a600585122cdcc5Marc Blank                TextUtilities.makeSnippetFromHtmlText(c + "\r\n\tfoo \r\n bar\n\t\r" + c));
6676f614720db6a282c3e890969a600585122cdcc5Marc Blank
6776f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Handle duplicated - and =
6876f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("Foo-Bar=Bletch",
6976f614720db6a282c3e890969a600585122cdcc5Marc Blank                TextUtilities.makeSnippetFromPlainText("Foo-----Bar=======Bletch"));
7076f614720db6a282c3e890969a600585122cdcc5Marc Blank
7176f614720db6a282c3e890969a600585122cdcc5Marc Blank        // We should catch HTML entities in these tests
7276f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(">", TextUtilities.makeSnippetFromHtmlText(" >"));
7376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("&<> \"", TextUtilities.makeSnippetFromHtmlText("&amp;&lt;&gt;&nbsp;&quot;"));
7476f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test for decimal and hex entities
7576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("ABC", TextUtilities.makeSnippetFromHtmlText("&#65;&#66;&#67;"));
7676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("ABC", TextUtilities.makeSnippetFromHtmlText("&#x41;&#x42;&#x43;"));
7776f614720db6a282c3e890969a600585122cdcc5Marc Blank
7876f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test for stripping simple tags
7976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("Hi there", TextUtilities.makeSnippetFromHtmlText("<html>Hi there</html>"));
8076f614720db6a282c3e890969a600585122cdcc5Marc Blank        // TODO: Add tests here if/when we find problematic HTML
8176f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
8276f614720db6a282c3e890969a600585122cdcc5Marc Blank
8376f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testStripHtmlEntityEdgeCases() {
8476f614720db6a282c3e890969a600585122cdcc5Marc Blank        int[] skipCount = new int[1];
8576f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Bare & isn't an entity
8676f614720db6a282c3e890969a600585122cdcc5Marc Blank        char c = TextUtilities.stripHtmlEntity("&", 0, skipCount);
8776f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
8876f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
8976f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Also not legal
9076f614720db6a282c3e890969a600585122cdcc5Marc Blank        c = TextUtilities.stripHtmlEntity("&;", 0, skipCount);
9176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
9276f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
9376f614720db6a282c3e890969a600585122cdcc5Marc Blank        // This is an entity, but shouldn't be found
9476f614720db6a282c3e890969a600585122cdcc5Marc Blank        c = TextUtilities.stripHtmlEntity("&nosuch;", 0, skipCount);
9576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
9676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
9776f614720db6a282c3e890969a600585122cdcc5Marc Blank        // This is too long for an entity, even though it starts like a valid one
9876f614720db6a282c3e890969a600585122cdcc5Marc Blank        c = TextUtilities.stripHtmlEntity("&nbspandmore;", 0, skipCount);
9976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
10076f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
10176f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Illegal decimal entities
10276f614720db6a282c3e890969a600585122cdcc5Marc Blank        c = TextUtilities.stripHtmlEntity("&#ABC", 0, skipCount);
10376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
10476f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
10576f614720db6a282c3e890969a600585122cdcc5Marc Blank        c = TextUtilities.stripHtmlEntity("&#12B", 0, skipCount);
10676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
10776f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
10876f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Illegal hex entities
10976f614720db6a282c3e890969a600585122cdcc5Marc Blank        c = TextUtilities.stripHtmlEntity("&#xABC", 0, skipCount);
11076f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
11176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
11276f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Illegal hex entities
11376f614720db6a282c3e890969a600585122cdcc5Marc Blank        c = TextUtilities.stripHtmlEntity("&#x19G", 0, skipCount);
11476f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(c, '&');
11576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(0, skipCount[0]);
11676f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
11776f614720db6a282c3e890969a600585122cdcc5Marc Blank
11876f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testStripContent() {
11976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("Visible", TextUtilities.makeSnippetFromHtmlText(
12076f614720db6a282c3e890969a600585122cdcc5Marc Blank            "<html><style foo=\"bar\">Not</style>Visible</html>"));
12176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("Visible", TextUtilities.makeSnippetFromHtmlText(
12276f614720db6a282c3e890969a600585122cdcc5Marc Blank            "<html><STYLE foo=\"bar\">Not</STYLE>Visible</html>"));
12376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("IsVisible", TextUtilities.makeSnippetFromHtmlText(
12476f614720db6a282c3e890969a600585122cdcc5Marc Blank            "<html><nostrip foo=\"bar\">Is</nostrip>Visible</html>"));
12576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("Visible", TextUtilities.makeSnippetFromHtmlText(
12676f614720db6a282c3e890969a600585122cdcc5Marc Blank            "<html>Visible<style foo=\"bar\">Not"));
12776f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("VisibleAgainVisible", TextUtilities.makeSnippetFromHtmlText(
12876f614720db6a282c3e890969a600585122cdcc5Marc Blank            "<html>Visible<style foo=\"bar\">Not</style>AgainVisible"));
12976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("VisibleAgainVisible", TextUtilities.makeSnippetFromHtmlText(
13076f614720db6a282c3e890969a600585122cdcc5Marc Blank            "<html>Visible<style foo=\"bar\"/>AgainVisible"));
13176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("VisibleAgainVisible", TextUtilities.makeSnippetFromHtmlText(
13276f614720db6a282c3e890969a600585122cdcc5Marc Blank            "<html>Visible<style foo=\"bar\"/><head><//blah<style>Not</head>AgainVisible"));
13376f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
13476f614720db6a282c3e890969a600585122cdcc5Marc Blank
13576f614720db6a282c3e890969a600585122cdcc5Marc Blank    /**
13676f614720db6a282c3e890969a600585122cdcc5Marc Blank     * We pass in HTML text in which an ampersand (@) is two chars ahead of the correct end position
13776f614720db6a282c3e890969a600585122cdcc5Marc Blank     * for the tag named 'tag' and then check whether the calculated end position matches the known
13876f614720db6a282c3e890969a600585122cdcc5Marc Blank     * correct position.  HTML text not containing an ampersand should generate a calculated end of
13976f614720db6a282c3e890969a600585122cdcc5Marc Blank     * -1
14076f614720db6a282c3e890969a600585122cdcc5Marc Blank     * @param text the HTML text to test
14176f614720db6a282c3e890969a600585122cdcc5Marc Blank     */
14276f614720db6a282c3e890969a600585122cdcc5Marc Blank    private void findTagEnd(String text, String tag) {
14376f614720db6a282c3e890969a600585122cdcc5Marc Blank        int calculatedEnd = TextUtilities.findTagEnd(text , tag, 0);
14476f614720db6a282c3e890969a600585122cdcc5Marc Blank        int knownEnd = text.indexOf('@') + 2;
14576f614720db6a282c3e890969a600585122cdcc5Marc Blank        if (knownEnd == 1) {
14676f614720db6a282c3e890969a600585122cdcc5Marc Blank            // indexOf will return -1, so we'll get 1 as knownEnd
14776f614720db6a282c3e890969a600585122cdcc5Marc Blank            assertEquals(-1, calculatedEnd);
14876f614720db6a282c3e890969a600585122cdcc5Marc Blank        } else {
14976f614720db6a282c3e890969a600585122cdcc5Marc Blank            assertEquals(calculatedEnd, knownEnd);
15076f614720db6a282c3e890969a600585122cdcc5Marc Blank        }
15176f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
15276f614720db6a282c3e890969a600585122cdcc5Marc Blank
15376f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testFindTagEnd() {
15476f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test with <tag ... />
15576f614720db6a282c3e890969a600585122cdcc5Marc Blank        findTagEnd("<tag foo=\"bar\"@ /> <blah blah>", "tag");
15676f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test with <tag ...> ... </tag>
15776f614720db6a282c3e890969a600585122cdcc5Marc Blank        findTagEnd("<tag foo=\"bar\">some text@</tag>some more text", "tag");
15876f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test with incomplete tag
15976f614720db6a282c3e890969a600585122cdcc5Marc Blank        findTagEnd("<tag foo=\"bar\">some more text but no end tag", "tag");
16076f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test with space at end of tag
16176f614720db6a282c3e890969a600585122cdcc5Marc Blank        findTagEnd("<tag foo=\"bar\">some more text but no end tag", "tag ");
16276f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
16376f614720db6a282c3e890969a600585122cdcc5Marc Blank
16476f614720db6a282c3e890969a600585122cdcc5Marc Blank    private void assertHighlightUnchanged(String str) {
16576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(str, TextUtilities.highlightTermsInHtml(str, null));
16676f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
16776f614720db6a282c3e890969a600585122cdcc5Marc Blank
16876f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHighlightNoTerm() {
16976f614720db6a282c3e890969a600585122cdcc5Marc Blank        // With no search terms, the html should be unchanged
17076f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertHighlightUnchanged("<html><style foo=\"bar\">Not</style>Visible</html>");
17176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertHighlightUnchanged("<html><nostrip foo=\"bar\">Is</nostrip>Visible</html>");
17276f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertHighlightUnchanged("<html>Visible<style foo=\"bar\">Not");
17376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertHighlightUnchanged("<html>Visible<style foo=\"bar\">Not</style>AgainVisible");
17476f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertHighlightUnchanged("<html>Visible<style foo=\"bar\"/>AgainVisible");
17576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertHighlightUnchanged(
17676f614720db6a282c3e890969a600585122cdcc5Marc Blank                "<html>Visible<style foo=\"bar\"/><head><//blah<style>Not</head>AgainVisible");
17776f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
17876f614720db6a282c3e890969a600585122cdcc5Marc Blank
17976f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHighlightSingleTermHtml() {
18076f614720db6a282c3e890969a600585122cdcc5Marc Blank        String str = "<html><style foo=\"bar\">Not</style>Visible</html>";
18176f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test that tags aren't highlighted
18276f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(str, TextUtilities.highlightTermsInHtml(
18376f614720db6a282c3e890969a600585122cdcc5Marc Blank                "<html><style foo=\"bar\">Not</style>Visible</html>", "style"));
18476f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Test that non-tags are
18576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("<html><style foo=\"bar\">Not</style><span " +
18676f614720db6a282c3e890969a600585122cdcc5Marc Blank                "style=\"background-color: " + TextUtilities.HIGHLIGHT_COLOR_STRING +
18776f614720db6a282c3e890969a600585122cdcc5Marc Blank                "\">Visi</span>ble</html>",
18876f614720db6a282c3e890969a600585122cdcc5Marc Blank                TextUtilities.highlightTermsInHtml(str, "Visi"));
18976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals("<html>Visible<style foo=\"bar\">Not</style>A<span" +
19076f614720db6a282c3e890969a600585122cdcc5Marc Blank                " style=\"background-color: " + TextUtilities.HIGHLIGHT_COLOR_STRING +
19176f614720db6a282c3e890969a600585122cdcc5Marc Blank                "\">gain</span>Visible",
19276f614720db6a282c3e890969a600585122cdcc5Marc Blank                TextUtilities.highlightTermsInHtml(
19376f614720db6a282c3e890969a600585122cdcc5Marc Blank                        "<html>Visible<style foo=\"bar\">Not</style>AgainVisible", "gain"));
19476f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
19576f614720db6a282c3e890969a600585122cdcc5Marc Blank
19676f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHighlightSingleTermText() {
19776f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Sprinkle text with a few HTML characters to make sure they're ignored
19876f614720db6a282c3e890969a600585122cdcc5Marc Blank        String text = "This< should be visibl>e";
19976f614720db6a282c3e890969a600585122cdcc5Marc Blank        // We should find this, because search terms are case insensitive
20076f614720db6a282c3e890969a600585122cdcc5Marc Blank        SpannableStringBuilder ssb =
20176f614720db6a282c3e890969a600585122cdcc5Marc Blank            (SpannableStringBuilder)TextUtilities.highlightTermsInText(text, "Visi");
20276f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan[] spans = ssb.getSpans(0, ssb.length(), BackgroundColorSpan.class);
20376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(1, spans.length);
20476f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan span = spans[0];
20576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("visi"), ssb.getSpanStart(span));
20676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("bl>e"), ssb.getSpanEnd(span));
20776f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Heh; this next test fails.. we use the search term!
20876f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text, ssb.toString());
20976f614720db6a282c3e890969a600585122cdcc5Marc Blank
21076f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Multiple instances of the term
21176f614720db6a282c3e890969a600585122cdcc5Marc Blank        text = "The research word should be a search result";
21276f614720db6a282c3e890969a600585122cdcc5Marc Blank        ssb = (SpannableStringBuilder)TextUtilities.highlightTermsInText(text, "Search");
21376f614720db6a282c3e890969a600585122cdcc5Marc Blank        spans = ssb.getSpans(0, ssb.length(), BackgroundColorSpan.class);
21476f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(2, spans.length);
21576f614720db6a282c3e890969a600585122cdcc5Marc Blank        span = spans[0];
21676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("search word"), ssb.getSpanStart(span));
21776f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf(" word"), ssb.getSpanEnd(span));
21876f614720db6a282c3e890969a600585122cdcc5Marc Blank        span = spans[1];
21976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("search result"), ssb.getSpanStart(span));
22076f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf(" result"), ssb.getSpanEnd(span));
22176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text, ssb.toString());
22276f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
22376f614720db6a282c3e890969a600585122cdcc5Marc Blank
22476f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHighlightTwoTermText() {
22576f614720db6a282c3e890969a600585122cdcc5Marc Blank        String text = "This should be visible";
22676f614720db6a282c3e890969a600585122cdcc5Marc Blank        // We should find this, because search terms are case insensitive
22776f614720db6a282c3e890969a600585122cdcc5Marc Blank        SpannableStringBuilder ssb =
22876f614720db6a282c3e890969a600585122cdcc5Marc Blank            (SpannableStringBuilder)TextUtilities.highlightTermsInText(text, "visi should");
22976f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan[] spans = ssb.getSpans(0, ssb.length(), BackgroundColorSpan.class);
23076f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(2, spans.length);
23176f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan span = spans[0];
23276f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("should"), ssb.getSpanStart(span));
23376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf(" be"), ssb.getSpanEnd(span));
23476f614720db6a282c3e890969a600585122cdcc5Marc Blank        span = spans[1];
23576f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("visi"), ssb.getSpanStart(span));
23676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("ble"), ssb.getSpanEnd(span));
23776f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text, ssb.toString());
23876f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
23976f614720db6a282c3e890969a600585122cdcc5Marc Blank
24076f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHighlightDuplicateTermText() {
24176f614720db6a282c3e890969a600585122cdcc5Marc Blank        String text = "This should be visible";
24276f614720db6a282c3e890969a600585122cdcc5Marc Blank        // We should find this, because search terms are case insensitive
24376f614720db6a282c3e890969a600585122cdcc5Marc Blank        SpannableStringBuilder ssb =
24476f614720db6a282c3e890969a600585122cdcc5Marc Blank            (SpannableStringBuilder)TextUtilities.highlightTermsInText(text, "should should");
24576f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan[] spans = ssb.getSpans(0, ssb.length(), BackgroundColorSpan.class);
24676f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(1, spans.length);
24776f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan span = spans[0];
24876f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("should"), ssb.getSpanStart(span));
24976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf(" be"), ssb.getSpanEnd(span));
25076f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
25176f614720db6a282c3e890969a600585122cdcc5Marc Blank
25276f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHighlightOverlapTermText() {
25376f614720db6a282c3e890969a600585122cdcc5Marc Blank        String text = "This shoulder is visible";
25476f614720db6a282c3e890969a600585122cdcc5Marc Blank        // We should find this, because search terms are case insensitive
25576f614720db6a282c3e890969a600585122cdcc5Marc Blank        SpannableStringBuilder ssb =
25676f614720db6a282c3e890969a600585122cdcc5Marc Blank            (SpannableStringBuilder)TextUtilities.highlightTermsInText(text, "should ould");
25776f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan[] spans = ssb.getSpans(0, ssb.length(), BackgroundColorSpan.class);
25876f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(1, spans.length);
25976f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan span = spans[0];
26076f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("should"), ssb.getSpanStart(span));
26176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("er is"), ssb.getSpanEnd(span));
26276f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
26376f614720db6a282c3e890969a600585122cdcc5Marc Blank
26476f614720db6a282c3e890969a600585122cdcc5Marc Blank
26576f614720db6a282c3e890969a600585122cdcc5Marc Blank    public void testHighlightOverlapTermText2() {
26676f614720db6a282c3e890969a600585122cdcc5Marc Blank        String text = "The shoulders are visible";
26776f614720db6a282c3e890969a600585122cdcc5Marc Blank        // We should find this, because search terms are case insensitive
26876f614720db6a282c3e890969a600585122cdcc5Marc Blank        SpannableStringBuilder ssb =
26976f614720db6a282c3e890969a600585122cdcc5Marc Blank            (SpannableStringBuilder)TextUtilities.highlightTermsInText(text, "shoulder shoulders");
27076f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan[] spans = ssb.getSpans(0, ssb.length(), BackgroundColorSpan.class);
27176f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(2, spans.length);
27276f614720db6a282c3e890969a600585122cdcc5Marc Blank        BackgroundColorSpan span = spans[0];
27376f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("shoulder"), ssb.getSpanStart(span));
27476f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("s are visible"), ssb.getSpanEnd(span));
27576f614720db6a282c3e890969a600585122cdcc5Marc Blank        span = spans[1];
27676f614720db6a282c3e890969a600585122cdcc5Marc Blank        // Just the 's' should be caught in the 2nd span
27776f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf("s are visible"), ssb.getSpanStart(span));
27876f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text.indexOf(" are visible"), ssb.getSpanEnd(span));
27976f614720db6a282c3e890969a600585122cdcc5Marc Blank        assertEquals(text, ssb.toString());
28076f614720db6a282c3e890969a600585122cdcc5Marc Blank    }
28176f614720db6a282c3e890969a600585122cdcc5Marc Blank    // For debugging large HTML samples
28276f614720db6a282c3e890969a600585122cdcc5Marc Blank
28376f614720db6a282c3e890969a600585122cdcc5Marc Blank//    private String readLargeSnippet(String fn) {
28476f614720db6a282c3e890969a600585122cdcc5Marc Blank//        File file = mContext.getFileStreamPath(fn);
28576f614720db6a282c3e890969a600585122cdcc5Marc Blank//        StringBuffer sb = new StringBuffer();
28676f614720db6a282c3e890969a600585122cdcc5Marc Blank//        BufferedReader reader = null;
28776f614720db6a282c3e890969a600585122cdcc5Marc Blank//        try {
28876f614720db6a282c3e890969a600585122cdcc5Marc Blank//            String text;
28976f614720db6a282c3e890969a600585122cdcc5Marc Blank//            reader = new BufferedReader(new FileReader(file));
29076f614720db6a282c3e890969a600585122cdcc5Marc Blank//            while ((text = reader.readLine()) != null) {
29176f614720db6a282c3e890969a600585122cdcc5Marc Blank//                sb.append(text);
29276f614720db6a282c3e890969a600585122cdcc5Marc Blank//                sb.append(" ");
29376f614720db6a282c3e890969a600585122cdcc5Marc Blank//            }
29476f614720db6a282c3e890969a600585122cdcc5Marc Blank//        } catch (IOException e) {
29576f614720db6a282c3e890969a600585122cdcc5Marc Blank//        }
29676f614720db6a282c3e890969a600585122cdcc5Marc Blank//        return sb.toString();
29776f614720db6a282c3e890969a600585122cdcc5Marc Blank//    }
29876f614720db6a282c3e890969a600585122cdcc5Marc Blank }
299