Blame - talk/base/stringencode_unittest.cc - webrtc.googlesource.com/src

blob: c1ec53fa1aefd5a0985750b4b0653b4cc5630574 [file] [log] [blame]

henrike@webrtc.org	28e2075	2013-07-10 00:45:36 +0000	[diff] [blame]	1	/*
				2	* libjingle
				3	* Copyright 2004, Google Inc.
				4	*
				5	* Redistribution and use in source and binary forms, with or without
				6	* modification, are permitted provided that the following conditions are met:
				7	*
				8	* 1. Redistributions of source code must retain the above copyright notice,
				9	* this list of conditions and the following disclaimer.
				10	* 2. Redistributions in binary form must reproduce the above copyright notice,
				11	* this list of conditions and the following disclaimer in the documentation
				12	* and/or other materials provided with the distribution.
				13	* 3. The name of the author may not be used to endorse or promote products
				14	* derived from this software without specific prior written permission.
				15	*
				16	* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
				17	* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
				18	* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
				19	* EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
				20	* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
				21	* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
				22	* OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
				23	* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
				24	* OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
				25	* ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
				26	*/
				27
				28	#include "talk/base/common.h"
				29	#include "talk/base/gunit.h"
				30	#include "talk/base/stringencode.h"
				31	#include "talk/base/stringutils.h"
				32
				33	namespace talk_base {
				34
				35	TEST(Utf8EncodeTest, EncodeDecode) {
				36	const struct Utf8Test {
				37	const char* encoded;
				38	size_t encsize, enclen;
				39	unsigned long decoded;
				40	} kTests[] = {
				41	{ "a ", 5, 1, 'a' },
				42	{ "\x7F ", 5, 1, 0x7F },
				43	{ "\xC2\x80 ", 5, 2, 0x80 },
				44	{ "\xDF\xBF ", 5, 2, 0x7FF },
				45	{ "\xE0\xA0\x80 ", 5, 3, 0x800 },
				46	{ "\xEF\xBF\xBF ", 5, 3, 0xFFFF },
				47	{ "\xF0\x90\x80\x80 ", 5, 4, 0x10000 },
				48	{ "\xF0\x90\x80\x80 ", 3, 0, 0x10000 },
				49	{ "\xF0\xF0\x80\x80 ", 5, 0, 0 },
				50	{ "\xF0\x90\x80 ", 5, 0, 0 },
				51	{ "\x90\x80\x80 ", 5, 0, 0 },
				52	{ NULL, 0, 0 },
				53	};
				54	for (size_t i = 0; kTests[i].encoded; ++i) {
				55	unsigned long val = 0;
				56	ASSERT_EQ(kTests[i].enclen, utf8_decode(kTests[i].encoded,
				57	kTests[i].encsize,
				58	&val));
				59	unsigned long result = (kTests[i].enclen == 0) ? 0 : kTests[i].decoded;
				60	ASSERT_EQ(result, val);
				61
				62	if (kTests[i].decoded == 0) {
				63	// Not an interesting encoding test case
				64	continue;
				65	}
				66
				67	char buffer[5];
				68	memset(buffer, 0x01, ARRAY_SIZE(buffer));
				69	ASSERT_EQ(kTests[i].enclen, utf8_encode(buffer,
				70	kTests[i].encsize,
				71	kTests[i].decoded));
				72	ASSERT_TRUE(memcmp(buffer, kTests[i].encoded, kTests[i].enclen) == 0);
				73	// Make sure remainder of buffer is unchanged
				74	ASSERT_TRUE(memory_check(buffer + kTests[i].enclen,
				75	0x1,
				76	ARRAY_SIZE(buffer) - kTests[i].enclen));
				77	}
				78	}
				79
				80	class HexEncodeTest : public testing::Test {
				81	public:
				82	HexEncodeTest() : enc_res_(0), dec_res_(0) {
				83	for (size_t i = 0; i < sizeof(data_); ++i) {
				84	data_[i] = (i + 128) & 0xff;
				85	}
				86	memset(decoded_, 0x7f, sizeof(decoded_));
				87	}
				88
				89	char data_[10];
				90	char encoded_[31];
				91	char decoded_[11];
				92	size_t enc_res_;
				93	size_t dec_res_;
				94	};
				95
				96	// Test that we can convert to/from hex with no delimiter.
				97	TEST_F(HexEncodeTest, TestWithNoDelimiter) {
				98	enc_res_ = hex_encode(encoded_, sizeof(encoded_), data_, sizeof(data_));
				99	ASSERT_EQ(sizeof(data_) * 2, enc_res_);
				100	ASSERT_STREQ("80818283848586878889", encoded_);
				101	dec_res_ = hex_decode(decoded_, sizeof(decoded_), encoded_, enc_res_);
				102	ASSERT_EQ(sizeof(data_), dec_res_);
				103	ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
				104	}
				105
				106	// Test that we can convert to/from hex with a colon delimiter.
				107	TEST_F(HexEncodeTest, TestWithDelimiter) {
				108	enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_),
				109	data_, sizeof(data_), ':');
				110	ASSERT_EQ(sizeof(data_) * 3 - 1, enc_res_);
				111	ASSERT_STREQ("80:81:82:83:84:85:86:87:88:89", encoded_);
				112	dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
				113	encoded_, enc_res_, ':');
				114	ASSERT_EQ(sizeof(data_), dec_res_);
				115	ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
				116	}
				117
				118	// Test that encoding with one delimiter and decoding with another fails.
				119	TEST_F(HexEncodeTest, TestWithWrongDelimiter) {
				120	enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_),
				121	data_, sizeof(data_), ':');
				122	ASSERT_EQ(sizeof(data_) * 3 - 1, enc_res_);
				123	dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
				124	encoded_, enc_res_, '/');
				125	ASSERT_EQ(0U, dec_res_);
				126	}
				127
				128	// Test that encoding without a delimiter and decoding with one fails.
				129	TEST_F(HexEncodeTest, TestExpectedDelimiter) {
				130	enc_res_ = hex_encode(encoded_, sizeof(encoded_), data_, sizeof(data_));
				131	ASSERT_EQ(sizeof(data_) * 2, enc_res_);
				132	dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
				133	encoded_, enc_res_, ':');
				134	ASSERT_EQ(0U, dec_res_);
				135	}
				136
				137	// Test that encoding with a delimiter and decoding without one fails.
				138	TEST_F(HexEncodeTest, TestExpectedNoDelimiter) {
				139	enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_),
				140	data_, sizeof(data_), ':');
				141	ASSERT_EQ(sizeof(data_) * 3 - 1, enc_res_);
				142	dec_res_ = hex_decode(decoded_, sizeof(decoded_), encoded_, enc_res_);
				143	ASSERT_EQ(0U, dec_res_);
				144	}
				145
				146	// Test that we handle a zero-length buffer with no delimiter.
				147	TEST_F(HexEncodeTest, TestZeroLengthNoDelimiter) {
				148	enc_res_ = hex_encode(encoded_, sizeof(encoded_), "", 0);
				149	ASSERT_EQ(0U, enc_res_);
				150	dec_res_ = hex_decode(decoded_, sizeof(decoded_), encoded_, enc_res_);
				151	ASSERT_EQ(0U, dec_res_);
				152	}
				153
				154	// Test that we handle a zero-length buffer with a delimiter.
				155	TEST_F(HexEncodeTest, TestZeroLengthWithDelimiter) {
				156	enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_), "", 0, ':');
				157	ASSERT_EQ(0U, enc_res_);
				158	dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
				159	encoded_, enc_res_, ':');
				160	ASSERT_EQ(0U, dec_res_);
				161	}
				162
				163	// Test the std::string variants that take no delimiter.
				164	TEST_F(HexEncodeTest, TestHelpersNoDelimiter) {
				165	std::string result = hex_encode(data_, sizeof(data_));
				166	ASSERT_EQ("80818283848586878889", result);
				167	dec_res_ = hex_decode(decoded_, sizeof(decoded_), result);
				168	ASSERT_EQ(sizeof(data_), dec_res_);
				169	ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
				170	}
				171
				172	// Test the std::string variants that use a delimiter.
				173	TEST_F(HexEncodeTest, TestHelpersWithDelimiter) {
				174	std::string result = hex_encode_with_delimiter(data_, sizeof(data_), ':');
				175	ASSERT_EQ("80:81:82:83:84:85:86:87:88:89", result);
				176	dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_), result, ':');
				177	ASSERT_EQ(sizeof(data_), dec_res_);
				178	ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
				179	}
				180
				181	// Test that encoding into a too-small output buffer (without delimiter) fails.
				182	TEST_F(HexEncodeTest, TestEncodeTooShort) {
				183	enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(data_) * 2,
				184	data_, sizeof(data_), 0);
				185	ASSERT_EQ(0U, enc_res_);
				186	}
				187
				188	// Test that encoding into a too-small output buffer (with delimiter) fails.
				189	TEST_F(HexEncodeTest, TestEncodeWithDelimiterTooShort) {
				190	enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(data_) * 3 - 1,
				191	data_, sizeof(data_), ':');
				192	ASSERT_EQ(0U, enc_res_);
				193	}
				194
				195	// Test that decoding into a too-small output buffer fails.
				196	TEST_F(HexEncodeTest, TestDecodeTooShort) {
				197	dec_res_ = hex_decode_with_delimiter(decoded_, 4, "0123456789", 10, 0);
				198	ASSERT_EQ(0U, dec_res_);
				199	ASSERT_EQ(0x7f, decoded_[4]);
				200	}
				201
				202	// Test that decoding non-hex data fails.
				203	TEST_F(HexEncodeTest, TestDecodeBogusData) {
				204	dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_), "xyz", 3, 0);
				205	ASSERT_EQ(0U, dec_res_);
				206	}
				207
				208	// Test that decoding an odd number of hex characters fails.
				209	TEST_F(HexEncodeTest, TestDecodeOddHexDigits) {
				210	dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_), "012", 3, 0);
				211	ASSERT_EQ(0U, dec_res_);
				212	}
				213
				214	// Test that decoding a string with too many delimiters fails.
				215	TEST_F(HexEncodeTest, TestDecodeWithDelimiterTooManyDelimiters) {
				216	dec_res_ = hex_decode_with_delimiter(decoded_, 4, "01::23::45::67", 14, ':');
				217	ASSERT_EQ(0U, dec_res_);
				218	}
				219
				220	// Test that decoding a string with a leading delimiter fails.
				221	TEST_F(HexEncodeTest, TestDecodeWithDelimiterLeadingDelimiter) {
				222	dec_res_ = hex_decode_with_delimiter(decoded_, 4, ":01:23:45:67", 12, ':');
				223	ASSERT_EQ(0U, dec_res_);
				224	}
				225
				226	// Test that decoding a string with a trailing delimiter fails.
				227	TEST_F(HexEncodeTest, TestDecodeWithDelimiterTrailingDelimiter) {
				228	dec_res_ = hex_decode_with_delimiter(decoded_, 4, "01:23:45:67:", 12, ':');
				229	ASSERT_EQ(0U, dec_res_);
				230	}
				231
				232	// Tests counting substrings.
				233	TEST(TokenizeTest, CountSubstrings) {
				234	std::vector<std::string> fields;
				235
				236	EXPECT_EQ(5ul, tokenize("one two three four five", ' ', &fields));
				237	fields.clear();
				238	EXPECT_EQ(1ul, tokenize("one", ' ', &fields));
				239
				240	// Extra spaces should be ignored.
				241	fields.clear();
				242	EXPECT_EQ(5ul, tokenize(" one two three four five ", ' ', &fields));
				243	fields.clear();
				244	EXPECT_EQ(1ul, tokenize(" one ", ' ', &fields));
				245	fields.clear();
				246	EXPECT_EQ(0ul, tokenize(" ", ' ', &fields));
				247	}
				248
				249	// Tests comparing substrings.
				250	TEST(TokenizeTest, CompareSubstrings) {
				251	std::vector<std::string> fields;
				252
				253	tokenize("find middle one", ' ', &fields);
				254	ASSERT_EQ(3ul, fields.size());
				255	ASSERT_STREQ("middle", fields.at(1).c_str());
				256	fields.clear();
				257
				258	// Extra spaces should be ignored.
				259	tokenize(" find middle one ", ' ', &fields);
				260	ASSERT_EQ(3ul, fields.size());
				261	ASSERT_STREQ("middle", fields.at(1).c_str());
				262	fields.clear();
				263	tokenize(" ", ' ', &fields);
				264	ASSERT_EQ(0ul, fields.size());
				265	}
				266
				267	TEST(TokenizeTest, TokenizeAppend) {
				268	ASSERT_EQ(0ul, tokenize_append("A B C", ' ', NULL));
				269
				270	std::vector<std::string> fields;
				271
				272	tokenize_append("A B C", ' ', &fields);
				273	ASSERT_EQ(3ul, fields.size());
				274	ASSERT_STREQ("B", fields.at(1).c_str());
				275
				276	tokenize_append("D E", ' ', &fields);
				277	ASSERT_EQ(5ul, fields.size());
				278	ASSERT_STREQ("B", fields.at(1).c_str());
				279	ASSERT_STREQ("E", fields.at(4).c_str());
				280	}
				281
				282	TEST(TokenizeTest, TokenizeWithMarks) {
				283	ASSERT_EQ(0ul, tokenize("D \"A B", ' ', '(', ')', NULL));
				284
				285	std::vector<std::string> fields;
				286	tokenize("A B C", ' ', '"', '"', &fields);
				287	ASSERT_EQ(3ul, fields.size());
				288	ASSERT_STREQ("C", fields.at(2).c_str());
				289
				290	tokenize("\"A B\" C", ' ', '"', '"', &fields);
				291	ASSERT_EQ(2ul, fields.size());
				292	ASSERT_STREQ("A B", fields.at(0).c_str());
				293
				294	tokenize("D \"A B\" C", ' ', '"', '"', &fields);
				295	ASSERT_EQ(3ul, fields.size());
				296	ASSERT_STREQ("D", fields.at(0).c_str());
				297	ASSERT_STREQ("A B", fields.at(1).c_str());
				298
				299	tokenize("D \"A B\" C \"E F\"", ' ', '"', '"', &fields);
				300	ASSERT_EQ(4ul, fields.size());
				301	ASSERT_STREQ("D", fields.at(0).c_str());
				302	ASSERT_STREQ("A B", fields.at(1).c_str());
				303	ASSERT_STREQ("E F", fields.at(3).c_str());
				304
				305	// No matching marks.
				306	tokenize("D \"A B", ' ', '"', '"', &fields);
				307	ASSERT_EQ(3ul, fields.size());
				308	ASSERT_STREQ("D", fields.at(0).c_str());
				309	ASSERT_STREQ("\"A", fields.at(1).c_str());
				310
				311	tokenize("D (A B) C (E F) G", ' ', '(', ')', &fields);
				312	ASSERT_EQ(5ul, fields.size());
				313	ASSERT_STREQ("D", fields.at(0).c_str());
				314	ASSERT_STREQ("A B", fields.at(1).c_str());
				315	ASSERT_STREQ("E F", fields.at(3).c_str());
				316	}
				317
				318	// Tests counting substrings.
				319	TEST(SplitTest, CountSubstrings) {
				320	std::vector<std::string> fields;
				321
				322	EXPECT_EQ(5ul, split("one,two,three,four,five", ',', &fields));
				323	fields.clear();
				324	EXPECT_EQ(1ul, split("one", ',', &fields));
				325
				326	// Empty fields between commas count.
				327	fields.clear();
				328	EXPECT_EQ(5ul, split("one,,three,four,five", ',', &fields));
				329	fields.clear();
				330	EXPECT_EQ(3ul, split(",three,", ',', &fields));
				331	fields.clear();
				332	EXPECT_EQ(1ul, split("", ',', &fields));
				333	}
				334
				335	// Tests comparing substrings.
				336	TEST(SplitTest, CompareSubstrings) {
				337	std::vector<std::string> fields;
				338
				339	split("find,middle,one", ',', &fields);
				340	ASSERT_EQ(3ul, fields.size());
				341	ASSERT_STREQ("middle", fields.at(1).c_str());
				342	fields.clear();
				343
				344	// Empty fields between commas count.
				345	split("find,,middle,one", ',', &fields);
				346	ASSERT_EQ(4ul, fields.size());
				347	ASSERT_STREQ("middle", fields.at(2).c_str());
				348	fields.clear();
				349	split("", ',', &fields);
				350	ASSERT_EQ(1ul, fields.size());
				351	ASSERT_STREQ("", fields.at(0).c_str());
				352	}
				353
				354	TEST(BoolTest, DecodeValid) {
				355	bool value;
				356	EXPECT_TRUE(FromString("true", &value));
				357	EXPECT_TRUE(value);
				358	EXPECT_TRUE(FromString("true,", &value));
				359	EXPECT_TRUE(value);
				360	EXPECT_TRUE(FromString("true , true", &value));
				361	EXPECT_TRUE(value);
				362	EXPECT_TRUE(FromString("true ,\n false", &value));
				363	EXPECT_TRUE(value);
				364	EXPECT_TRUE(FromString(" true \n", &value));
				365	EXPECT_TRUE(value);
				366
				367	EXPECT_TRUE(FromString("false", &value));
				368	EXPECT_FALSE(value);
				369	EXPECT_TRUE(FromString(" false ", &value));
				370	EXPECT_FALSE(value);
				371	EXPECT_TRUE(FromString(" false, ", &value));
				372	EXPECT_FALSE(value);
				373
				374	EXPECT_TRUE(FromString<bool>("true\n"));
				375	EXPECT_FALSE(FromString<bool>("false\n"));
				376	}
				377
				378	TEST(BoolTest, DecodeInvalid) {
				379	bool value;
				380	EXPECT_FALSE(FromString("True", &value));
				381	EXPECT_FALSE(FromString("TRUE", &value));
				382	EXPECT_FALSE(FromString("False", &value));
				383	EXPECT_FALSE(FromString("FALSE", &value));
				384	EXPECT_FALSE(FromString("0", &value));
				385	EXPECT_FALSE(FromString("1", &value));
				386	EXPECT_FALSE(FromString("0,", &value));
				387	EXPECT_FALSE(FromString("1,", &value));
				388	EXPECT_FALSE(FromString("1,0", &value));
				389	EXPECT_FALSE(FromString("1.", &value));
				390	EXPECT_FALSE(FromString("1.0", &value));
				391	EXPECT_FALSE(FromString("", &value));
				392	EXPECT_FALSE(FromString<bool>("false\nfalse"));
				393	}
				394
				395	TEST(BoolTest, RoundTrip) {
				396	bool value;
				397	EXPECT_TRUE(FromString(ToString(true), &value));
				398	EXPECT_TRUE(value);
				399	EXPECT_TRUE(FromString(ToString(false), &value));
				400	EXPECT_FALSE(value);
				401	}
				402	} // namespace talk_base