407 lines
10 KiB
C++
407 lines
10 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#include <gtest/gtest.h>
|
|
#include "butil/string_splitter.h"
|
|
#include <stdlib.h>
|
|
|
|
namespace {
|
|
class StringSplitterTest : public ::testing::Test{
|
|
protected:
|
|
StringSplitterTest(){};
|
|
virtual ~StringSplitterTest(){};
|
|
virtual void SetUp() {
|
|
srand (time(0));
|
|
};
|
|
virtual void TearDown() {
|
|
};
|
|
};
|
|
|
|
|
|
TEST_F(StringSplitterTest, sanity) {
|
|
const char* str = "hello there! man ";
|
|
butil::StringSplitter ss(str, ' ');
|
|
// "hello"
|
|
ASSERT_TRUE(ss != NULL);
|
|
ASSERT_EQ(5ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str);
|
|
|
|
// "there!"
|
|
++ss;
|
|
ASSERT_NE(ss, (void*)NULL);
|
|
ASSERT_EQ(6ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str+6);
|
|
|
|
// "man"
|
|
++ss;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(3ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str+15);
|
|
|
|
++ss;
|
|
ASSERT_FALSE(ss);
|
|
ASSERT_EQ(0ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str + strlen(str));
|
|
|
|
// consecutive separators are treated as zero-length field inside
|
|
butil::StringSplitter ss2(str, ' ', butil::ALLOW_EMPTY_FIELD);
|
|
|
|
// "hello"
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(5ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "hello", ss2.length()));
|
|
|
|
// "there!"
|
|
++ss2;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(6ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "there!", ss2.length()));
|
|
|
|
// ""
|
|
++ss2;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(0ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str+13);
|
|
|
|
// ""
|
|
++ss2;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(0ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str+14);
|
|
|
|
// "man"
|
|
++ss2;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(3ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str+15);
|
|
|
|
++ss2;
|
|
ASSERT_FALSE(ss2);
|
|
ASSERT_EQ(0ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str+19);
|
|
}
|
|
|
|
|
|
TEST_F(StringSplitterTest, single_word)
|
|
{
|
|
const char* str = "apple";
|
|
butil::StringSplitter ss(str, ' ');
|
|
// "apple"
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(5ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str);
|
|
|
|
++ss;
|
|
ASSERT_FALSE(ss);
|
|
ASSERT_EQ(0ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str+5);
|
|
}
|
|
|
|
TEST_F(StringSplitterTest, starting_with_separator) {
|
|
const char* str = " apple";
|
|
butil::StringSplitter ss(str, ' ');
|
|
// "apple"
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(5ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "apple", ss.length()));
|
|
|
|
++ss;
|
|
ASSERT_FALSE(ss);
|
|
ASSERT_EQ(0ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str + strlen(str));
|
|
|
|
butil::StringSplitter ss2(str, ' ', butil::ALLOW_EMPTY_FIELD);
|
|
// ""
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(0ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str);
|
|
|
|
// ""
|
|
++ss2;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(0ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str+1);
|
|
|
|
// "apple"
|
|
++ss2;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(5ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "apple", ss2.length()));
|
|
|
|
++ss2;
|
|
ASSERT_FALSE(ss2);
|
|
ASSERT_EQ(0ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str + strlen(str));
|
|
}
|
|
|
|
TEST_F(StringSplitterTest, site_id_as_example) {
|
|
const char* str = "|123|12||1|21|4321";
|
|
butil::StringSplitter ss(str, '|');
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(3ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "123", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(2ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "12", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(1ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "1", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(2ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "21", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(4ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "4321", ss.length()));
|
|
|
|
++ss;
|
|
ASSERT_FALSE(ss);
|
|
ASSERT_EQ(0ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str + strlen(str));
|
|
}
|
|
|
|
TEST_F(StringSplitterTest, number_list) {
|
|
const char* str = " 123,,12,1, 21 4321\00056";
|
|
butil::StringMultiSplitter ss(str, ", ");
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(3ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "123", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(2ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "12", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(1ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "1", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(2ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "21", ss.length()));
|
|
|
|
ss++;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(4ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "4321", ss.length()));
|
|
|
|
++ss;
|
|
ASSERT_FALSE(ss);
|
|
ASSERT_EQ(0ul, ss.length());
|
|
ASSERT_EQ(ss.field(), str + strlen(str));
|
|
|
|
// contains embedded '\0'
|
|
const size_t str_len = 23;
|
|
butil::StringMultiSplitter ss2(str, str + str_len, ", ");
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(3ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "123", ss2.length()));
|
|
|
|
ss2++;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(2ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "12", ss2.length()));
|
|
|
|
ss2++;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(1ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "1", ss2.length()));
|
|
|
|
ss2++;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(2ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "21", ss2.length()));
|
|
|
|
ss2++;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(7ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "4321\00056", ss2.length()));
|
|
|
|
++ss2;
|
|
ASSERT_FALSE(ss2);
|
|
ASSERT_EQ(0ul, ss2.length());
|
|
ASSERT_EQ(ss2.field(), str + str_len);
|
|
}
|
|
|
|
TEST_F(StringSplitterTest, cast_type) {
|
|
const char* str = "-1\t123\t111\t1\t10\t11\t1.3\t3.1415926\t127\t128\t256";
|
|
int i = 0;
|
|
unsigned int u = 0;
|
|
long l = 0;
|
|
unsigned long ul = 0;
|
|
long long ll = 0;
|
|
unsigned long long ull = 0;
|
|
float f = 0.0;
|
|
double d = 0.0;
|
|
|
|
butil::StringSplitter ss(str, '\t');
|
|
ASSERT_TRUE(ss);
|
|
|
|
ASSERT_EQ(0, ss.to_int(&i));
|
|
ASSERT_EQ(-1, i);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(0, ss.to_uint(&u));
|
|
ASSERT_EQ(123u, u);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(0, ss.to_long(&l));
|
|
ASSERT_EQ(111, l);
|
|
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(0, ss.to_ulong(&ul));
|
|
ASSERT_EQ(1ul, ul);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(0, ss.to_longlong(&ll));
|
|
ASSERT_EQ(10, ll);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(0, ss.to_ulonglong(&ull));
|
|
ASSERT_EQ(11ull, ull);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(0, ss.to_float(&f));
|
|
ASSERT_FLOAT_EQ(1.3, f);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(0, ss.to_double(&d));
|
|
ASSERT_DOUBLE_EQ(3.1415926, d);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
int8_t c = 0;
|
|
ASSERT_EQ(0, ss.to_int8(&c));
|
|
ASSERT_EQ(127, c);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
uint8_t uc = 0;
|
|
ASSERT_EQ(0, ss.to_uint8(&uc));
|
|
ASSERT_EQ(128U, uc);
|
|
|
|
ASSERT_TRUE(++ss);
|
|
ASSERT_EQ(-1, ss.to_uint8(&uc));
|
|
}
|
|
|
|
TEST_F(StringSplitterTest, split_limit_len) {
|
|
const char* str = "1\t1\0003\t111\t1\t10\t11\t1.3\t3.1415926";
|
|
butil::StringSplitter ss(str, str + 5, '\t');
|
|
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(1ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "1", ss.length()));
|
|
|
|
++ss;
|
|
ASSERT_TRUE(ss);
|
|
ASSERT_EQ(3ul, ss.length());
|
|
ASSERT_FALSE(strncmp(ss.field(), "1\0003", ss.length()));
|
|
|
|
++ss;
|
|
ASSERT_FALSE(ss);
|
|
|
|
// Allows using '\0' as separator
|
|
butil::StringSplitter ss2(str, str + 5, '\0');
|
|
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(3ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "1\t1", ss2.length()));
|
|
|
|
++ss2;
|
|
ASSERT_TRUE(ss2);
|
|
ASSERT_EQ(1ul, ss2.length());
|
|
ASSERT_FALSE(strncmp(ss2.field(), "3", ss2.length()));
|
|
|
|
++ss2;
|
|
ASSERT_FALSE(ss2);
|
|
|
|
butil::StringPiece sp(str, 5);
|
|
// Allows using '\0' as separator
|
|
butil::StringSplitter ss3(sp, '\0');
|
|
|
|
ASSERT_TRUE(ss3);
|
|
ASSERT_EQ(3ul, ss3.length());
|
|
ASSERT_FALSE(strncmp(ss3.field(), "1\t1", ss3.length()));
|
|
|
|
++ss3;
|
|
ASSERT_TRUE(ss3);
|
|
ASSERT_EQ(1ul, ss3.length());
|
|
ASSERT_FALSE(strncmp(ss3.field(), "3", ss3.length()));
|
|
|
|
++ss3;
|
|
ASSERT_FALSE(ss3);
|
|
}
|
|
|
|
TEST_F(StringSplitterTest, key_value_pairs_splitter_sanity) {
|
|
std::string kvstr = "key1=value1&&&key2=value2&key3=value3&===&key4=&=&=value5";
|
|
for (int i = 0 ; i < 3; ++i) {
|
|
// Test three constructors
|
|
butil::KeyValuePairsSplitter* psplitter = NULL;
|
|
if (i == 0) {
|
|
psplitter = new butil::KeyValuePairsSplitter(kvstr, '&', '=');
|
|
} else if (i == 1) {
|
|
psplitter = new butil::KeyValuePairsSplitter(
|
|
kvstr.data(), kvstr.data() + kvstr.size(), '&', '=');
|
|
} else if (i == 2) {
|
|
psplitter = new butil::KeyValuePairsSplitter(kvstr.c_str(), '&', '=');
|
|
}
|
|
butil::KeyValuePairsSplitter& splitter = *psplitter;
|
|
|
|
ASSERT_TRUE(splitter);
|
|
ASSERT_EQ(splitter.key(), "key1");
|
|
ASSERT_EQ(splitter.value(), "value1");
|
|
++splitter;
|
|
ASSERT_TRUE(splitter);
|
|
ASSERT_EQ(splitter.key(), "key2");
|
|
ASSERT_EQ(splitter.value(), "value2");
|
|
++splitter;
|
|
ASSERT_TRUE(splitter);
|
|
ASSERT_EQ(splitter.key(), "key3");
|
|
ASSERT_EQ(splitter.value(), "value3");
|
|
++splitter;
|
|
ASSERT_TRUE(splitter);
|
|
ASSERT_EQ(splitter.key(), "");
|
|
ASSERT_EQ(splitter.value(), "==");
|
|
++splitter;
|
|
ASSERT_TRUE(splitter);
|
|
ASSERT_EQ(splitter.key(), "key4");
|
|
ASSERT_EQ(splitter.value(), "");
|
|
++splitter;
|
|
ASSERT_TRUE(splitter);
|
|
ASSERT_EQ(splitter.key(), "");
|
|
ASSERT_EQ(splitter.value(), "");
|
|
++splitter;
|
|
ASSERT_TRUE(splitter);
|
|
ASSERT_EQ(splitter.key(), "");
|
|
ASSERT_EQ(splitter.value(), "value5");
|
|
++splitter;
|
|
ASSERT_FALSE(splitter);
|
|
|
|
delete psplitter;
|
|
}
|
|
}
|
|
|
|
}
|