1 # -*- coding: utf-8 -*-
4 class UTF8Test < ActiveSupport::TestCase
6 assert_equal true, UTF8.valid?("test")
7 assert_equal true, UTF8.valid?("vergrößern")
8 assert_equal true, UTF8.valid?("ルシステムにも対応します")
9 assert_equal true, UTF8.valid?("輕觸搖晃的遊戲")
11 assert_equal false, UTF8.valid?("\xC0") # always invalid utf8
12 assert_equal false, UTF8.valid?("\xC2\x4a") # 2-byte multibyte identifier, followed by plain ASCII
13 assert_equal false, UTF8.valid?("\xC2\xC2") # 2-byte multibyte identifier, followed by another one
14 assert_equal false, UTF8.valid?("\x4a\x82") # plain ASCII, followed by multibyte continuation
15 assert_equal false, UTF8.valid?("\x82\x82") # multibyte continuations without multibyte identifier
16 assert_equal false, UTF8.valid?("\xe1\x82\x4a") # three-byte identifier, contination and (incorrectly) plain ASCII