tests/functional/text-wordbreak-test.js

	text-wordbreak-test.js revision cc70141342b8690e43bef6d8cef0c38fcfba8227
YUI.add('text-wordbreak-test', function (Y) {

var Assert      = Y.Assert,
    ArrayAssert = Y.ArrayAssert,
    WB          = Y.Text.WordBreak;

Y.Test.Runner.add(new Y.Test.Case({
    name: 'Text.WordBreak',

    // -- isWordBoundary() -----------------------------------------------------
    'isWordBoundary() should not break between most letters': function () {
        Assert.isFalse(WB.isWordBoundary('aaa', 1));
        Assert.isFalse(WB.isWordBoundary('áåä', 1));
        Assert.isFalse(WB.isWordBoundary('aäa', 1));
    },

    'isWordBoundary() should not break letters across certain punctuation': function () {
        Assert.isFalse(WB.isWordBoundary("can't", 2));
        Assert.isFalse(WB.isWordBoundary("can’t", 2));
        Assert.isFalse(WB.isWordBoundary('foo.bar', 2));
        Assert.isFalse(WB.isWordBoundary('foo:bar', 2));
    },

    'isWordBoundary() should not break across sequences of digits or digits adjacent to letters': function () {
        Assert.isFalse(WB.isWordBoundary('123', 1));
        Assert.isFalse(WB.isWordBoundary('a123', 1));
        Assert.isFalse(WB.isWordBoundary('1a23', 1));
    },

    'isWordBoundary() should not break inside numeric sequences': function () {
        Assert.isFalse(WB.isWordBoundary('3.14', 1));
        Assert.isFalse(WB.isWordBoundary('1,024', 1));
    },

    'isWordBoundary() should ignore format and extend characters': function () {
        Assert.isFalse(WB.isWordBoundary('foo\u00ADbar', 2));
        Assert.isFalse(WB.isWordBoundary('foo\u0300bar', 2));
    },

    'isWordBoundary() should not break inside CRLF': function () {
        Assert.isFalse(WB.isWordBoundary('foo\r\nbar', 3));
    },

    'isWordBoundary() should break before newlines': function () {
        Assert.isTrue(WB.isWordBoundary('foo\rbar', 2));
        Assert.isTrue(WB.isWordBoundary('foo\nbar', 2));
        Assert.isTrue(WB.isWordBoundary('foo\r\nbar', 2));
    },

    'isWordBoundary() should break after newlines': function () {
        Assert.isTrue(WB.isWordBoundary('foo\rbar', 3));
        Assert.isTrue(WB.isWordBoundary('foo\nbar', 3));
        Assert.isTrue(WB.isWordBoundary('foo\r\nbar', 4));
    },

    'isWordBoundary() should not break between Katakana characters': function () {
        Assert.isFalse(WB.isWordBoundary('パイ', 0));
    },

    'isWordBoundary() should not break from extenders': function () {
        Assert.isFalse(WB.isWordBoundary('foo_bar', 2));
        Assert.isFalse(WB.isWordBoundary('__', 0));
    },

    'isWordBoundary() should break everywhere else': function () {
        Assert.isTrue(WB.isWordBoundary('foo bar', 2));
        Assert.isTrue(WB.isWordBoundary('foo\tbar', 2));
        Assert.isTrue(WB.isWordBoundary('foo&bar', 2));
        Assert.isTrue(WB.isWordBoundary('foo"bar"', 2));
        Assert.isTrue(WB.isWordBoundary('foo(bar)', 2));
        Assert.isTrue(WB.isWordBoundary('foo/bar', 2));
    },

    // -- getWords() -----------------------------------------------------------
    'getWords() should split a string into words': function () {
        // Also tests default exclusion of whitespace.
        ArrayAssert.itemsAreSame(['foo', 'bar', 'baz'], WB.getWords('foo bar baz'));
        ArrayAssert.itemsAreSame(['パイ', 'が', '良', 'い', 'で', 'す'], WB.getWords('パイが良いです'));
    },

    'getWords() should preserve case by default': function () {
        ArrayAssert.itemsAreSame(['foo', 'BAR', 'baz'], WB.getWords('foo BAR baz'));
    },

    'getWords() should support an ignoreCase option': function () {
        ArrayAssert.itemsAreSame(['foo', 'bar'], WB.getWords('Foo Bar', {ignoreCase: true}));
    },

    'getWords() should exclude punctuation-only words by default': function () {
        ArrayAssert.itemsAreSame(
            ['Tut', 'tut', 'it', 'looks', 'like', 'rain'],
            WB.getWords('Tut-tut, it looks like rain.')
        );
    },

    'getWords() should support an includePunctuation option': function () {
        ArrayAssert.itemsAreSame(
            ['Tut', '-', 'tut', ',', 'it', 'looks', 'like', 'rain', '.'],
            WB.getWords('Tut-tut, it looks like rain.', {includePunctuation: true})
        );
    },

    'getWords() should support an includeWhitespace option': function () {
        ArrayAssert.itemsAreSame(
            ['foo', ' ', 'bar', ' ', 'baz'],
            WB.getWords('foo bar baz', {includeWhitespace: true})
        );

        ArrayAssert.itemsAreSame(
            ['foo', ' ', ' ', 'bar'],
            WB.getWords('foo  bar', {includeWhitespace: true})
        );

        ArrayAssert.itemsAreSame(
            ['foo', '\t', 'bar'],
            WB.getWords('foo\tbar', {includeWhitespace: true})
        );

        ArrayAssert.itemsAreSame(
            ['foo', '\n', 'bar'],
            WB.getWords('foo\nbar', {includeWhitespace: true})
        );
    },

    // -- getUniqueWords() -----------------------------------------------------
    'getUniqueWords() should only return unique words': function () {
        ArrayAssert.itemsAreSame(['hungry', 'hippo'], WB.getUniqueWords('hungry hungry hippo'));
    }
}));

}, '@VERSION@', {requires:['text-wordbreak', 'test']});