|  | // Copyright (c) 2011 The Chromium Authors. All rights reserved. | 
|  | // Use of this source code is governed by a BSD-style license that can be | 
|  | // found in the LICENSE file. | 
|  |  | 
|  | #include "base/i18n/char_iterator.h" | 
|  |  | 
|  | #include "base/strings/utf_string_conversions.h" | 
|  | #include "testing/gtest/include/gtest/gtest.h" | 
|  |  | 
|  | namespace base { | 
|  | namespace i18n { | 
|  |  | 
|  | TEST(CharIteratorsTest, TestUTF8) { | 
|  | std::string empty; | 
|  | UTF8CharIterator empty_iter(&empty); | 
|  | ASSERT_TRUE(empty_iter.end()); | 
|  | ASSERT_EQ(0, empty_iter.array_pos()); | 
|  | ASSERT_EQ(0, empty_iter.char_pos()); | 
|  | ASSERT_FALSE(empty_iter.Advance()); | 
|  |  | 
|  | std::string str("s\303\273r");  // [u with circumflex] | 
|  | UTF8CharIterator iter(&str); | 
|  | ASSERT_FALSE(iter.end()); | 
|  | ASSERT_EQ(0, iter.array_pos()); | 
|  | ASSERT_EQ(0, iter.char_pos()); | 
|  | ASSERT_EQ('s', iter.get()); | 
|  | ASSERT_TRUE(iter.Advance()); | 
|  |  | 
|  | ASSERT_FALSE(iter.end()); | 
|  | ASSERT_EQ(1, iter.array_pos()); | 
|  | ASSERT_EQ(1, iter.char_pos()); | 
|  | ASSERT_EQ(251, iter.get()); | 
|  | ASSERT_TRUE(iter.Advance()); | 
|  |  | 
|  | ASSERT_FALSE(iter.end()); | 
|  | ASSERT_EQ(3, iter.array_pos()); | 
|  | ASSERT_EQ(2, iter.char_pos()); | 
|  | ASSERT_EQ('r', iter.get()); | 
|  | ASSERT_TRUE(iter.Advance()); | 
|  |  | 
|  | ASSERT_TRUE(iter.end()); | 
|  | ASSERT_EQ(4, iter.array_pos()); | 
|  | ASSERT_EQ(3, iter.char_pos()); | 
|  |  | 
|  | // Don't care what it returns, but this shouldn't crash | 
|  | iter.get(); | 
|  |  | 
|  | ASSERT_FALSE(iter.Advance()); | 
|  | } | 
|  |  | 
|  | TEST(CharIteratorsTest, TestUTF16) { | 
|  | string16 empty = UTF8ToUTF16(""); | 
|  | UTF16CharIterator empty_iter(&empty); | 
|  | ASSERT_TRUE(empty_iter.end()); | 
|  | ASSERT_EQ(0, empty_iter.array_pos()); | 
|  | ASSERT_EQ(0, empty_iter.char_pos()); | 
|  | ASSERT_FALSE(empty_iter.Advance()); | 
|  |  | 
|  | // This test string contains 4 characters: | 
|  | //   x | 
|  | //   u with circumflex - 2 bytes in UTF8, 1 codeword in UTF16 | 
|  | //   math double-struck A - 4 bytes in UTF8, 2 codewords in UTF16 | 
|  | //   z | 
|  | string16 str = UTF8ToUTF16("x\303\273\360\235\224\270z"); | 
|  | UTF16CharIterator iter(&str); | 
|  | ASSERT_FALSE(iter.end()); | 
|  | ASSERT_EQ(0, iter.array_pos()); | 
|  | ASSERT_EQ(0, iter.char_pos()); | 
|  | ASSERT_EQ('x', iter.get()); | 
|  | ASSERT_TRUE(iter.Advance()); | 
|  |  | 
|  | ASSERT_FALSE(iter.end()); | 
|  | ASSERT_EQ(1, iter.array_pos()); | 
|  | ASSERT_EQ(1, iter.char_pos()); | 
|  | ASSERT_EQ(251, iter.get()); | 
|  | ASSERT_TRUE(iter.Advance()); | 
|  |  | 
|  | ASSERT_FALSE(iter.end()); | 
|  | ASSERT_EQ(2, iter.array_pos()); | 
|  | ASSERT_EQ(2, iter.char_pos()); | 
|  | ASSERT_EQ(120120, iter.get()); | 
|  | ASSERT_TRUE(iter.Advance()); | 
|  |  | 
|  | ASSERT_FALSE(iter.end()); | 
|  | ASSERT_EQ(4, iter.array_pos()); | 
|  | ASSERT_EQ(3, iter.char_pos()); | 
|  | ASSERT_EQ('z', iter.get()); | 
|  | ASSERT_TRUE(iter.Advance()); | 
|  |  | 
|  | ASSERT_TRUE(iter.end()); | 
|  | ASSERT_EQ(5, iter.array_pos()); | 
|  | ASSERT_EQ(4, iter.char_pos()); | 
|  |  | 
|  | // Don't care what it returns, but this shouldn't crash | 
|  | iter.get(); | 
|  |  | 
|  | ASSERT_FALSE(iter.Advance()); | 
|  | } | 
|  |  | 
|  | }  // namespace i18n | 
|  | }  // namespace base |