89 lines
3.7 KiB
Text
89 lines
3.7 KiB
Text
-- Copyright (c) 2013, Thomas Goyne <plorkyeran@aegisub.org>
|
||
--
|
||
-- Permission to use, copy, modify, and distribute this software for any
|
||
-- purpose with or without fee is hereby granted, provided that the above
|
||
-- copyright notice and this permission notice appear in all copies.
|
||
--
|
||
-- THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
|
||
-- WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
|
||
-- MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
|
||
-- ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
|
||
-- WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
|
||
-- ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
|
||
-- OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
|
||
|
||
unicode = require 'aegisub.unicode'
|
||
|
||
describe 'charwidth', ->
|
||
it 'should return 1 for an ascii character', ->
|
||
assert.is.equal 1, unicode.charwidth 'a'
|
||
it 'should return 2 for a two byte character', ->
|
||
assert.is.equal 2, unicode.charwidth 'ß'
|
||
it 'should return 3 for a three byte character', ->
|
||
assert.is.equal 3, unicode.charwidth 'c'
|
||
it 'should return 4 for a four byte character', ->
|
||
assert.is.equal 4, unicode.charwidth '🄓'
|
||
|
||
describe 'char_iterator', ->
|
||
it 'should iterator over multi-byte codepoints', ->
|
||
chars = [c for c in unicode.chars 'aßc🄓']
|
||
assert.is.equal 4, #chars
|
||
assert.is.equal chars[1], 'a'
|
||
assert.is.equal chars[2], 'ß'
|
||
assert.is.equal chars[3], 'c'
|
||
assert.is.equal chars[4], '🄓'
|
||
|
||
describe 'len', ->
|
||
it 'should give length in codepoints', ->
|
||
assert.is.equal 4, unicode.len 'aßc🄓'
|
||
|
||
describe 'codepoint', ->
|
||
it 'should give codepoint as an integer for a string', ->
|
||
assert.is.equal 97, unicode.codepoint 'a'
|
||
assert.is.equal 223, unicode.codepoint 'ß'
|
||
assert.is.equal 0xFF43, unicode.codepoint 'c'
|
||
assert.is.equal 0x1F113, unicode.codepoint '🄓'
|
||
it 'should give ignore codepoints after the first', ->
|
||
assert.is.equal 97, unicode.codepoint 'abc'
|
||
|
||
describe 'to_upper_case', ->
|
||
it 'should support plain ASCII', ->
|
||
assert.is.equal 'ABC', unicode.to_upper_case 'abc'
|
||
it 'should support accents', ->
|
||
assert.is.equal 'ÀÈÌ', unicode.to_upper_case 'àèì'
|
||
it 'should support fullwidth letters', ->
|
||
assert.is.equal 'ABC', unicode.to_upper_case 'abc'
|
||
it 'should support greek', ->
|
||
assert.is.equal 'ΑΒΓ', unicode.to_upper_case 'αβγ'
|
||
it 'should support sharp-s', ->
|
||
assert.is.equal 'SS', unicode.to_upper_case 'ß'
|
||
it 'should support ligatures', ->
|
||
assert.is.equal 'FFI', unicode.to_upper_case 'ffi'
|
||
|
||
describe 'to_lower_case', ->
|
||
it 'should support plain ASCII', ->
|
||
assert.is.equal 'abc', unicode.to_lower_case 'ABC'
|
||
it 'should support accents', ->
|
||
assert.is.equal 'àèì', unicode.to_lower_case 'ÀÈÌ'
|
||
it 'should support fullwidth letters', ->
|
||
assert.is.equal 'abc', unicode.to_lower_case 'ABC'
|
||
it 'should support greek', ->
|
||
assert.is.equal 'αβγ', unicode.to_lower_case 'ΑΒΓ'
|
||
it 'should support sharp-s', ->
|
||
assert.is.equal 'ß', unicode.to_lower_case 'ẞ'
|
||
-- note: Unicode doesn't have any uppercase precomposed ligatures
|
||
|
||
describe 'to_fold_case', ->
|
||
it 'should support plain ASCII', ->
|
||
assert.is.equal 'abc', unicode.to_fold_case 'ABC'
|
||
it 'should support accents', ->
|
||
assert.is.equal 'àèì', unicode.to_fold_case 'ÀÈÌ'
|
||
it 'should support fullwidth letters', ->
|
||
assert.is.equal 'abc', unicode.to_fold_case 'ABC'
|
||
it 'should support greek', ->
|
||
assert.is.equal 'αβγ', unicode.to_fold_case 'ΑΒΓ'
|
||
it 'should support sharp-s', ->
|
||
assert.is.equal 'ss', unicode.to_fold_case 'ẞ'
|
||
it 'should support ligatures', ->
|
||
assert.is.equal 'ffi', unicode.to_fold_case 'ffi'
|
||
|