blob: fc1f481e22ac9644754278f3b4d8c0eeab8110d7 [file] [log] [blame]
/*
* libjingle
* Copyright 2004--2011, Google Inc.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* 1. Redistributions of source code must retain the above copyright notice,
* this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright notice,
* this list of conditions and the following disclaimer in the documentation
* and/or other materials provided with the distribution.
* 3. The name of the author may not be used to endorse or promote products
* derived from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
* EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
* OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
* OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
* ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "talk/base/common.h"
#include "talk/base/gunit.h"
#include "talk/base/stringencode.h"
#include "talk/base/stringutils.h"
namespace talk_base {
TEST(utf8_encode, EncodeDecode) {
const struct Utf8Test {
const char* encoded;
size_t encsize, enclen;
unsigned long decoded;
} kTests[] = {
{ "a ", 5, 1, 'a' },
{ "\x7F ", 5, 1, 0x7F },
{ "\xC2\x80 ", 5, 2, 0x80 },
{ "\xDF\xBF ", 5, 2, 0x7FF },
{ "\xE0\xA0\x80 ", 5, 3, 0x800 },
{ "\xEF\xBF\xBF ", 5, 3, 0xFFFF },
{ "\xF0\x90\x80\x80 ", 5, 4, 0x10000 },
{ "\xF0\x90\x80\x80 ", 3, 0, 0x10000 },
{ "\xF0\xF0\x80\x80 ", 5, 0, 0 },
{ "\xF0\x90\x80 ", 5, 0, 0 },
{ "\x90\x80\x80 ", 5, 0, 0 },
{ NULL, 0, 0 },
};
for (size_t i=0; kTests[i].encoded; ++i) {
unsigned long val = 0;
ASSERT_EQ(kTests[i].enclen, utf8_decode(kTests[i].encoded,
kTests[i].encsize,
&val));
unsigned long result = (kTests[i].enclen == 0) ? 0 : kTests[i].decoded;
ASSERT_EQ(result, val);
if (kTests[i].decoded == 0) {
// Not an interesting encoding test case
continue;
}
char buffer[5];
memset(buffer, 0x01, ARRAY_SIZE(buffer));
ASSERT_EQ(kTests[i].enclen, utf8_encode(buffer,
kTests[i].encsize,
kTests[i].decoded));
ASSERT_TRUE(memcmp(buffer, kTests[i].encoded, kTests[i].enclen) == 0);
// Make sure remainder of buffer is unchanged
ASSERT_TRUE(memory_check(buffer + kTests[i].enclen,
0x1,
ARRAY_SIZE(buffer) - kTests[i].enclen));
}
}
// TODO: hex_encode unittest
// Tests counting substrings.
TEST(tokenizeTest, CountSubstrings) {
std::vector<std::string> fields;
EXPECT_EQ(5ul, tokenize("one two three four five", ' ', &fields));
fields.clear();
EXPECT_EQ(1ul, tokenize("one", ' ', &fields));
// Extra spaces should be ignored.
fields.clear();
EXPECT_EQ(5ul, tokenize(" one two three four five ", ' ', &fields));
fields.clear();
EXPECT_EQ(1ul, tokenize(" one ", ' ', &fields));
fields.clear();
EXPECT_EQ(0ul, tokenize(" ", ' ', &fields));
}
// Tests comparing substrings.
TEST(tokenizeTest, CompareSubstrings) {
std::vector<std::string> fields;
tokenize("find middle one", ' ', &fields);
ASSERT_EQ(3ul, fields.size());
ASSERT_STREQ("middle", fields.at(1).c_str());
fields.clear();
// Extra spaces should be ignored.
tokenize(" find middle one ", ' ', &fields);
ASSERT_EQ(3ul, fields.size());
ASSERT_STREQ("middle", fields.at(1).c_str());
fields.clear();
tokenize(" ", ' ', &fields);
ASSERT_EQ(0ul, fields.size());
}
TEST(tokenizeTest, TokenizeAppend) {
ASSERT_EQ(0ul, tokenize_append("A B C", ' ', NULL));
std::vector<std::string> fields;
tokenize_append("A B C", ' ', &fields);
ASSERT_EQ(3ul, fields.size());
ASSERT_STREQ("B", fields.at(1).c_str());
tokenize_append("D E", ' ', &fields);
ASSERT_EQ(5ul, fields.size());
ASSERT_STREQ("B", fields.at(1).c_str());
ASSERT_STREQ("E", fields.at(4).c_str());
}
TEST(tokenizeTest, TokenizeWithMarks) {
ASSERT_EQ(0ul, tokenize("D \"A B", ' ', '(', ')', NULL));
std::vector<std::string> fields;
tokenize("A B C", ' ', '"', '"', &fields);
ASSERT_EQ(3ul, fields.size());
ASSERT_STREQ("C", fields.at(2).c_str());
tokenize("\"A B\" C", ' ', '"', '"', &fields);
ASSERT_EQ(2ul, fields.size());
ASSERT_STREQ("A B", fields.at(0).c_str());
tokenize("D \"A B\" C", ' ', '"', '"', &fields);
ASSERT_EQ(3ul, fields.size());
ASSERT_STREQ("D", fields.at(0).c_str());
ASSERT_STREQ("A B", fields.at(1).c_str());
tokenize("D \"A B\" C \"E F\"", ' ', '"', '"', &fields);
ASSERT_EQ(4ul, fields.size());
ASSERT_STREQ("D", fields.at(0).c_str());
ASSERT_STREQ("A B", fields.at(1).c_str());
ASSERT_STREQ("E F", fields.at(3).c_str());
// No matching marks.
tokenize("D \"A B", ' ', '"', '"', &fields);
ASSERT_EQ(3ul, fields.size());
ASSERT_STREQ("D", fields.at(0).c_str());
ASSERT_STREQ("\"A", fields.at(1).c_str());
tokenize("D (A B) C (E F) G", ' ', '(', ')', &fields);
ASSERT_EQ(5ul, fields.size());
ASSERT_STREQ("D", fields.at(0).c_str());
ASSERT_STREQ("A B", fields.at(1).c_str());
ASSERT_STREQ("E F", fields.at(3).c_str());
}
// Tests counting substrings.
TEST(splitTest, CountSubstrings) {
std::vector<std::string> fields;
EXPECT_EQ(5ul, split("one,two,three,four,five", ',', &fields));
fields.clear();
EXPECT_EQ(1ul, split("one", ',', &fields));
// Empty fields between commas count.
fields.clear();
EXPECT_EQ(5ul, split("one,,three,four,five", ',', &fields));
fields.clear();
EXPECT_EQ(3ul, split(",three,", ',', &fields));
fields.clear();
EXPECT_EQ(1ul, split("", ',', &fields));
}
// Tests comparing substrings.
TEST(splitTest, CompareSubstrings) {
std::vector<std::string> fields;
split("find,middle,one", ',', &fields);
ASSERT_EQ(3ul, fields.size());
ASSERT_STREQ("middle", fields.at(1).c_str());
fields.clear();
// Empty fields between commas count.
split("find,,middle,one", ',', &fields);
ASSERT_EQ(4ul, fields.size());
ASSERT_STREQ("middle", fields.at(2).c_str());
fields.clear();
split("", ',', &fields);
ASSERT_EQ(1ul, fields.size());
ASSERT_STREQ("", fields.at(0).c_str());
}
} // namespace talk_base