1 /*
2  *  Copyright 2004 The WebRTC Project Authors. All rights reserved.
3  *
4  *  Use of this source code is governed by a BSD-style license
5  *  that can be found in the LICENSE file in the root of the source
6  *  tree. An additional intellectual property rights grant can be found
7  *  in the file PATENTS.  All contributing project authors may
8  *  be found in the AUTHORS file in the root of the source tree.
9  */
10 
11 #include "webrtc/base/arraysize.h"
12 #include "webrtc/base/common.h"
13 #include "webrtc/base/gunit.h"
14 #include "webrtc/base/stringencode.h"
15 #include "webrtc/base/stringutils.h"
16 
17 namespace rtc {
18 
TEST(Utf8EncodeTest,EncodeDecode)19 TEST(Utf8EncodeTest, EncodeDecode) {
20   const struct Utf8Test {
21     const char* encoded;
22     size_t encsize, enclen;
23     unsigned long decoded;
24   } kTests[] = {
25     { "a    ",             5, 1, 'a' },
26     { "\x7F    ",          5, 1, 0x7F },
27     { "\xC2\x80   ",       5, 2, 0x80 },
28     { "\xDF\xBF   ",       5, 2, 0x7FF },
29     { "\xE0\xA0\x80  ",    5, 3, 0x800 },
30     { "\xEF\xBF\xBF  ",    5, 3, 0xFFFF },
31     { "\xF0\x90\x80\x80 ", 5, 4, 0x10000 },
32     { "\xF0\x90\x80\x80 ", 3, 0, 0x10000 },
33     { "\xF0\xF0\x80\x80 ", 5, 0, 0 },
34     { "\xF0\x90\x80  ",    5, 0, 0 },
35     { "\x90\x80\x80  ",    5, 0, 0 },
36     { NULL, 0, 0 },
37   };
38   for (size_t i = 0; kTests[i].encoded; ++i) {
39     unsigned long val = 0;
40     ASSERT_EQ(kTests[i].enclen, utf8_decode(kTests[i].encoded,
41                                             kTests[i].encsize,
42                                             &val));
43     unsigned long result = (kTests[i].enclen == 0) ? 0 : kTests[i].decoded;
44     ASSERT_EQ(result, val);
45 
46     if (kTests[i].decoded == 0) {
47       // Not an interesting encoding test case
48       continue;
49     }
50 
51     char buffer[5];
52     memset(buffer, 0x01, arraysize(buffer));
53     ASSERT_EQ(kTests[i].enclen, utf8_encode(buffer,
54                                             kTests[i].encsize,
55                                             kTests[i].decoded));
56     ASSERT_TRUE(memcmp(buffer, kTests[i].encoded, kTests[i].enclen) == 0);
57     // Make sure remainder of buffer is unchanged
58     ASSERT_TRUE(memory_check(buffer + kTests[i].enclen,
59                              0x1,
60                              arraysize(buffer) - kTests[i].enclen));
61   }
62 }
63 
64 class HexEncodeTest : public testing::Test {
65  public:
HexEncodeTest()66   HexEncodeTest() : enc_res_(0), dec_res_(0) {
67     for (size_t i = 0; i < sizeof(data_); ++i) {
68       data_[i] = (i + 128) & 0xff;
69     }
70     memset(decoded_, 0x7f, sizeof(decoded_));
71   }
72 
73   char data_[10];
74   char encoded_[31];
75   char decoded_[11];
76   size_t enc_res_;
77   size_t dec_res_;
78 };
79 
80 // Test that we can convert to/from hex with no delimiter.
TEST_F(HexEncodeTest,TestWithNoDelimiter)81 TEST_F(HexEncodeTest, TestWithNoDelimiter) {
82   enc_res_ = hex_encode(encoded_, sizeof(encoded_), data_, sizeof(data_));
83   ASSERT_EQ(sizeof(data_) * 2, enc_res_);
84   ASSERT_STREQ("80818283848586878889", encoded_);
85   dec_res_ = hex_decode(decoded_, sizeof(decoded_), encoded_, enc_res_);
86   ASSERT_EQ(sizeof(data_), dec_res_);
87   ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
88 }
89 
90 // Test that we can convert to/from hex with a colon delimiter.
TEST_F(HexEncodeTest,TestWithDelimiter)91 TEST_F(HexEncodeTest, TestWithDelimiter) {
92   enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_),
93                                        data_, sizeof(data_), ':');
94   ASSERT_EQ(sizeof(data_) * 3 - 1, enc_res_);
95   ASSERT_STREQ("80:81:82:83:84:85:86:87:88:89", encoded_);
96   dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
97                                        encoded_, enc_res_, ':');
98   ASSERT_EQ(sizeof(data_), dec_res_);
99   ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
100 }
101 
102 // Test that encoding with one delimiter and decoding with another fails.
TEST_F(HexEncodeTest,TestWithWrongDelimiter)103 TEST_F(HexEncodeTest, TestWithWrongDelimiter) {
104   enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_),
105                                        data_, sizeof(data_), ':');
106   ASSERT_EQ(sizeof(data_) * 3 - 1, enc_res_);
107   dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
108                                        encoded_, enc_res_, '/');
109   ASSERT_EQ(0U, dec_res_);
110 }
111 
112 // Test that encoding without a delimiter and decoding with one fails.
TEST_F(HexEncodeTest,TestExpectedDelimiter)113 TEST_F(HexEncodeTest, TestExpectedDelimiter) {
114   enc_res_ = hex_encode(encoded_, sizeof(encoded_), data_, sizeof(data_));
115   ASSERT_EQ(sizeof(data_) * 2, enc_res_);
116   dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
117                                        encoded_, enc_res_, ':');
118   ASSERT_EQ(0U, dec_res_);
119 }
120 
121 // Test that encoding with a delimiter and decoding without one fails.
TEST_F(HexEncodeTest,TestExpectedNoDelimiter)122 TEST_F(HexEncodeTest, TestExpectedNoDelimiter) {
123   enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_),
124                                        data_, sizeof(data_), ':');
125   ASSERT_EQ(sizeof(data_) * 3 - 1, enc_res_);
126   dec_res_ = hex_decode(decoded_, sizeof(decoded_), encoded_, enc_res_);
127   ASSERT_EQ(0U, dec_res_);
128 }
129 
130 // Test that we handle a zero-length buffer with no delimiter.
TEST_F(HexEncodeTest,TestZeroLengthNoDelimiter)131 TEST_F(HexEncodeTest, TestZeroLengthNoDelimiter) {
132   enc_res_ = hex_encode(encoded_, sizeof(encoded_), "", 0);
133   ASSERT_EQ(0U, enc_res_);
134   dec_res_ = hex_decode(decoded_, sizeof(decoded_), encoded_, enc_res_);
135   ASSERT_EQ(0U, dec_res_);
136 }
137 
138 // Test that we handle a zero-length buffer with a delimiter.
TEST_F(HexEncodeTest,TestZeroLengthWithDelimiter)139 TEST_F(HexEncodeTest, TestZeroLengthWithDelimiter) {
140   enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(encoded_), "", 0, ':');
141   ASSERT_EQ(0U, enc_res_);
142   dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_),
143                                        encoded_, enc_res_, ':');
144   ASSERT_EQ(0U, dec_res_);
145 }
146 
147 // Test the std::string variants that take no delimiter.
TEST_F(HexEncodeTest,TestHelpersNoDelimiter)148 TEST_F(HexEncodeTest, TestHelpersNoDelimiter) {
149   std::string result = hex_encode(data_, sizeof(data_));
150   ASSERT_EQ("80818283848586878889", result);
151   dec_res_ = hex_decode(decoded_, sizeof(decoded_), result);
152   ASSERT_EQ(sizeof(data_), dec_res_);
153   ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
154 }
155 
156 // Test the std::string variants that use a delimiter.
TEST_F(HexEncodeTest,TestHelpersWithDelimiter)157 TEST_F(HexEncodeTest, TestHelpersWithDelimiter) {
158   std::string result = hex_encode_with_delimiter(data_, sizeof(data_), ':');
159   ASSERT_EQ("80:81:82:83:84:85:86:87:88:89", result);
160   dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_), result, ':');
161   ASSERT_EQ(sizeof(data_), dec_res_);
162   ASSERT_EQ(0, memcmp(data_, decoded_, dec_res_));
163 }
164 
165 // Test that encoding into a too-small output buffer (without delimiter) fails.
TEST_F(HexEncodeTest,TestEncodeTooShort)166 TEST_F(HexEncodeTest, TestEncodeTooShort) {
167   enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(data_) * 2,
168                                        data_, sizeof(data_), 0);
169   ASSERT_EQ(0U, enc_res_);
170 }
171 
172 // Test that encoding into a too-small output buffer (with delimiter) fails.
TEST_F(HexEncodeTest,TestEncodeWithDelimiterTooShort)173 TEST_F(HexEncodeTest, TestEncodeWithDelimiterTooShort) {
174   enc_res_ = hex_encode_with_delimiter(encoded_, sizeof(data_) * 3 - 1,
175                                        data_, sizeof(data_), ':');
176   ASSERT_EQ(0U, enc_res_);
177 }
178 
179 // Test that decoding into a too-small output buffer fails.
TEST_F(HexEncodeTest,TestDecodeTooShort)180 TEST_F(HexEncodeTest, TestDecodeTooShort) {
181   dec_res_ = hex_decode_with_delimiter(decoded_, 4, "0123456789", 10, 0);
182   ASSERT_EQ(0U, dec_res_);
183   ASSERT_EQ(0x7f, decoded_[4]);
184 }
185 
186 // Test that decoding non-hex data fails.
TEST_F(HexEncodeTest,TestDecodeBogusData)187 TEST_F(HexEncodeTest, TestDecodeBogusData) {
188   dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_), "xyz", 3, 0);
189   ASSERT_EQ(0U, dec_res_);
190 }
191 
192 // Test that decoding an odd number of hex characters fails.
TEST_F(HexEncodeTest,TestDecodeOddHexDigits)193 TEST_F(HexEncodeTest, TestDecodeOddHexDigits) {
194   dec_res_ = hex_decode_with_delimiter(decoded_, sizeof(decoded_), "012", 3, 0);
195   ASSERT_EQ(0U, dec_res_);
196 }
197 
198 // Test that decoding a string with too many delimiters fails.
TEST_F(HexEncodeTest,TestDecodeWithDelimiterTooManyDelimiters)199 TEST_F(HexEncodeTest, TestDecodeWithDelimiterTooManyDelimiters) {
200   dec_res_ = hex_decode_with_delimiter(decoded_, 4, "01::23::45::67", 14, ':');
201   ASSERT_EQ(0U, dec_res_);
202 }
203 
204 // Test that decoding a string with a leading delimiter fails.
TEST_F(HexEncodeTest,TestDecodeWithDelimiterLeadingDelimiter)205 TEST_F(HexEncodeTest, TestDecodeWithDelimiterLeadingDelimiter) {
206   dec_res_ = hex_decode_with_delimiter(decoded_, 4, ":01:23:45:67", 12, ':');
207   ASSERT_EQ(0U, dec_res_);
208 }
209 
210 // Test that decoding a string with a trailing delimiter fails.
TEST_F(HexEncodeTest,TestDecodeWithDelimiterTrailingDelimiter)211 TEST_F(HexEncodeTest, TestDecodeWithDelimiterTrailingDelimiter) {
212   dec_res_ = hex_decode_with_delimiter(decoded_, 4, "01:23:45:67:", 12, ':');
213   ASSERT_EQ(0U, dec_res_);
214 }
215 
216 // Tests counting substrings.
TEST(TokenizeTest,CountSubstrings)217 TEST(TokenizeTest, CountSubstrings) {
218   std::vector<std::string> fields;
219 
220   EXPECT_EQ(5ul, tokenize("one two three four five", ' ', &fields));
221   fields.clear();
222   EXPECT_EQ(1ul, tokenize("one", ' ', &fields));
223 
224   // Extra spaces should be ignored.
225   fields.clear();
226   EXPECT_EQ(5ul, tokenize("  one    two  three    four five  ", ' ', &fields));
227   fields.clear();
228   EXPECT_EQ(1ul, tokenize("  one  ", ' ', &fields));
229   fields.clear();
230   EXPECT_EQ(0ul, tokenize(" ", ' ', &fields));
231 }
232 
233 // Tests comparing substrings.
TEST(TokenizeTest,CompareSubstrings)234 TEST(TokenizeTest, CompareSubstrings) {
235   std::vector<std::string> fields;
236 
237   tokenize("find middle one", ' ', &fields);
238   ASSERT_EQ(3ul, fields.size());
239   ASSERT_STREQ("middle", fields.at(1).c_str());
240   fields.clear();
241 
242   // Extra spaces should be ignored.
243   tokenize("  find   middle  one    ", ' ', &fields);
244   ASSERT_EQ(3ul, fields.size());
245   ASSERT_STREQ("middle", fields.at(1).c_str());
246   fields.clear();
247   tokenize(" ", ' ', &fields);
248   ASSERT_EQ(0ul, fields.size());
249 }
250 
TEST(TokenizeTest,TokenizeAppend)251 TEST(TokenizeTest, TokenizeAppend) {
252   ASSERT_EQ(0ul, tokenize_append("A B C", ' ', NULL));
253 
254   std::vector<std::string> fields;
255 
256   tokenize_append("A B C", ' ', &fields);
257   ASSERT_EQ(3ul, fields.size());
258   ASSERT_STREQ("B", fields.at(1).c_str());
259 
260   tokenize_append("D E", ' ', &fields);
261   ASSERT_EQ(5ul, fields.size());
262   ASSERT_STREQ("B", fields.at(1).c_str());
263   ASSERT_STREQ("E", fields.at(4).c_str());
264 }
265 
TEST(TokenizeTest,TokenizeWithMarks)266 TEST(TokenizeTest, TokenizeWithMarks) {
267   ASSERT_EQ(0ul, tokenize("D \"A B", ' ', '(', ')', NULL));
268 
269   std::vector<std::string> fields;
270   tokenize("A B C", ' ', '"', '"', &fields);
271   ASSERT_EQ(3ul, fields.size());
272   ASSERT_STREQ("C", fields.at(2).c_str());
273 
274   tokenize("\"A B\" C", ' ', '"', '"', &fields);
275   ASSERT_EQ(2ul, fields.size());
276   ASSERT_STREQ("A B", fields.at(0).c_str());
277 
278   tokenize("D \"A B\" C", ' ', '"', '"', &fields);
279   ASSERT_EQ(3ul, fields.size());
280   ASSERT_STREQ("D", fields.at(0).c_str());
281   ASSERT_STREQ("A B", fields.at(1).c_str());
282 
283   tokenize("D \"A B\" C \"E F\"", ' ', '"', '"', &fields);
284   ASSERT_EQ(4ul, fields.size());
285   ASSERT_STREQ("D", fields.at(0).c_str());
286   ASSERT_STREQ("A B", fields.at(1).c_str());
287   ASSERT_STREQ("E F", fields.at(3).c_str());
288 
289   // No matching marks.
290   tokenize("D \"A B", ' ', '"', '"', &fields);
291   ASSERT_EQ(3ul, fields.size());
292   ASSERT_STREQ("D", fields.at(0).c_str());
293   ASSERT_STREQ("\"A", fields.at(1).c_str());
294 
295   tokenize("D (A B) C (E F) G", ' ', '(', ')', &fields);
296   ASSERT_EQ(5ul, fields.size());
297   ASSERT_STREQ("D", fields.at(0).c_str());
298   ASSERT_STREQ("A B", fields.at(1).c_str());
299   ASSERT_STREQ("E F", fields.at(3).c_str());
300 }
301 
TEST(TokenizeTest,TokenizeWithEmptyTokens)302 TEST(TokenizeTest, TokenizeWithEmptyTokens) {
303   std::vector<std::string> fields;
304   EXPECT_EQ(3ul, tokenize_with_empty_tokens("a.b.c", '.', &fields));
305   EXPECT_EQ("a", fields[0]);
306   EXPECT_EQ("b", fields[1]);
307   EXPECT_EQ("c", fields[2]);
308 
309   EXPECT_EQ(3ul, tokenize_with_empty_tokens("..c", '.', &fields));
310   EXPECT_TRUE(fields[0].empty());
311   EXPECT_TRUE(fields[1].empty());
312   EXPECT_EQ("c", fields[2]);
313 
314   EXPECT_EQ(1ul, tokenize_with_empty_tokens("", '.', &fields));
315   EXPECT_TRUE(fields[0].empty());
316 }
317 
TEST(TokenizeFirstTest,NoLeadingSpaces)318 TEST(TokenizeFirstTest, NoLeadingSpaces) {
319   std::string token;
320   std::string rest;
321 
322   ASSERT_TRUE(tokenize_first("A &*${}", ' ', &token, &rest));
323   ASSERT_STREQ("A", token.c_str());
324   ASSERT_STREQ("&*${}", rest.c_str());
325 
326   ASSERT_TRUE(tokenize_first("A B& *${}", ' ', &token, &rest));
327   ASSERT_STREQ("A", token.c_str());
328   ASSERT_STREQ("B& *${}", rest.c_str());
329 
330   ASSERT_TRUE(tokenize_first("A    B& *${}    ", ' ', &token, &rest));
331   ASSERT_STREQ("A", token.c_str());
332   ASSERT_STREQ("B& *${}    ", rest.c_str());
333 }
334 
TEST(TokenizeFirstTest,LeadingSpaces)335 TEST(TokenizeFirstTest, LeadingSpaces) {
336   std::string token;
337   std::string rest;
338 
339   ASSERT_TRUE(tokenize_first("     A B C", ' ', &token, &rest));
340   ASSERT_STREQ("", token.c_str());
341   ASSERT_STREQ("A B C", rest.c_str());
342 
343   ASSERT_TRUE(tokenize_first("     A    B   C    ", ' ', &token, &rest));
344   ASSERT_STREQ("", token.c_str());
345   ASSERT_STREQ("A    B   C    ", rest.c_str());
346 }
347 
TEST(TokenizeFirstTest,SingleToken)348 TEST(TokenizeFirstTest, SingleToken) {
349   std::string token;
350   std::string rest;
351 
352   // In the case where we cannot find delimiter the whole string is a token.
353   ASSERT_FALSE(tokenize_first("ABC", ' ', &token, &rest));
354 
355   ASSERT_TRUE(tokenize_first("ABC    ", ' ', &token, &rest));
356   ASSERT_STREQ("ABC", token.c_str());
357   ASSERT_STREQ("", rest.c_str());
358 
359   ASSERT_TRUE(tokenize_first("    ABC    ", ' ', &token, &rest));
360   ASSERT_STREQ("", token.c_str());
361   ASSERT_STREQ("ABC    ", rest.c_str());
362 }
363 
364 // Tests counting substrings.
TEST(SplitTest,CountSubstrings)365 TEST(SplitTest, CountSubstrings) {
366   std::vector<std::string> fields;
367 
368   EXPECT_EQ(5ul, split("one,two,three,four,five", ',', &fields));
369   fields.clear();
370   EXPECT_EQ(1ul, split("one", ',', &fields));
371 
372   // Empty fields between commas count.
373   fields.clear();
374   EXPECT_EQ(5ul, split("one,,three,four,five", ',', &fields));
375   fields.clear();
376   EXPECT_EQ(3ul, split(",three,", ',', &fields));
377   fields.clear();
378   EXPECT_EQ(1ul, split("", ',', &fields));
379 }
380 
381 // Tests comparing substrings.
TEST(SplitTest,CompareSubstrings)382 TEST(SplitTest, CompareSubstrings) {
383   std::vector<std::string> fields;
384 
385   split("find,middle,one", ',', &fields);
386   ASSERT_EQ(3ul, fields.size());
387   ASSERT_STREQ("middle", fields.at(1).c_str());
388   fields.clear();
389 
390   // Empty fields between commas count.
391   split("find,,middle,one", ',', &fields);
392   ASSERT_EQ(4ul, fields.size());
393   ASSERT_STREQ("middle", fields.at(2).c_str());
394   fields.clear();
395   split("", ',', &fields);
396   ASSERT_EQ(1ul, fields.size());
397   ASSERT_STREQ("", fields.at(0).c_str());
398 }
399 
TEST(BoolTest,DecodeValid)400 TEST(BoolTest, DecodeValid) {
401   bool value;
402   EXPECT_TRUE(FromString("true", &value));
403   EXPECT_TRUE(value);
404   EXPECT_TRUE(FromString("true,", &value));
405   EXPECT_TRUE(value);
406   EXPECT_TRUE(FromString("true , true", &value));
407   EXPECT_TRUE(value);
408   EXPECT_TRUE(FromString("true ,\n false", &value));
409   EXPECT_TRUE(value);
410   EXPECT_TRUE(FromString("  true  \n", &value));
411   EXPECT_TRUE(value);
412 
413   EXPECT_TRUE(FromString("false", &value));
414   EXPECT_FALSE(value);
415   EXPECT_TRUE(FromString("  false ", &value));
416   EXPECT_FALSE(value);
417   EXPECT_TRUE(FromString("  false, ", &value));
418   EXPECT_FALSE(value);
419 
420   EXPECT_TRUE(FromString<bool>("true\n"));
421   EXPECT_FALSE(FromString<bool>("false\n"));
422 }
423 
TEST(BoolTest,DecodeInvalid)424 TEST(BoolTest, DecodeInvalid) {
425   bool value;
426   EXPECT_FALSE(FromString("True", &value));
427   EXPECT_FALSE(FromString("TRUE", &value));
428   EXPECT_FALSE(FromString("False", &value));
429   EXPECT_FALSE(FromString("FALSE", &value));
430   EXPECT_FALSE(FromString("0", &value));
431   EXPECT_FALSE(FromString("1", &value));
432   EXPECT_FALSE(FromString("0,", &value));
433   EXPECT_FALSE(FromString("1,", &value));
434   EXPECT_FALSE(FromString("1,0", &value));
435   EXPECT_FALSE(FromString("1.", &value));
436   EXPECT_FALSE(FromString("1.0", &value));
437   EXPECT_FALSE(FromString("", &value));
438   EXPECT_FALSE(FromString<bool>("false\nfalse"));
439 }
440 
TEST(BoolTest,RoundTrip)441 TEST(BoolTest, RoundTrip) {
442   bool value;
443   EXPECT_TRUE(FromString(ToString(true), &value));
444   EXPECT_TRUE(value);
445   EXPECT_TRUE(FromString(ToString(false), &value));
446   EXPECT_FALSE(value);
447 }
448 
449 }  // namespace rtc
450