diff options
Diffstat (limited to 'src/base')
-rw-r--r-- | src/base/SConscript | 1 | ||||
-rw-r--r-- | src/base/str.hh | 14 | ||||
-rw-r--r-- | src/base/str.test.cc | 459 |
3 files changed, 470 insertions, 4 deletions
diff --git a/src/base/SConscript b/src/base/SConscript index ca8182203..d6615be13 100644 --- a/src/base/SConscript +++ b/src/base/SConscript @@ -71,6 +71,7 @@ if env['TARGET_ISA'] != 'null': Source('socket.cc') Source('statistics.cc') Source('str.cc') +GTest('str.test', 'str.test.cc', 'str.cc') Source('time.cc') Source('trace.cc') GTest('trie.test', 'trie.test.cc') diff --git a/src/base/str.hh b/src/base/str.hh index 1ea18b70d..48fccc8eb 100644 --- a/src/base/str.hh +++ b/src/base/str.hh @@ -85,12 +85,14 @@ to_lower(const std::string &s) } // Split the string s into lhs and rhs on the first occurence of the -// character c. +// character c. Character c is not included in either lhs or rhs. If +// character c is not contained within string s, lsh equals s. bool split_first(const std::string &s, std::string &lhs, std::string &rhs, char c); // Split the string s into lhs and rhs on the last occurence of the -// character c. +// character c. Character c is not included in either lhs or rhs. If +// character c is not contained within string s, lhs equals s. bool split_last(const std::string &s, std::string &lhs, std::string &rhs, char c); @@ -115,8 +117,10 @@ __to_number(const std::string &value) { // start big and narrow it down if needed, determine the base dynamically long long r = std::stoll(value, nullptr, 0); - if (r < std::numeric_limits<T>::min() || r > std::numeric_limits<T>::max()) + if (r < std::numeric_limits<T>::lowest() + || r > std::numeric_limits<T>::max()) { throw std::out_of_range("Out of range"); + } return static_cast<T>(r); } @@ -146,8 +150,10 @@ __to_number(const std::string &value) { // start big and narrow it down if needed long double r = std::stold(value); - if (r < std::numeric_limits<T>::min() || r > std::numeric_limits<T>::max()) + if (r < std::numeric_limits<T>::lowest() + || r > std::numeric_limits<T>::max()) { throw std::out_of_range("Out of range"); + } return static_cast<T>(r); } /** @} */ diff --git a/src/base/str.test.cc b/src/base/str.test.cc new file mode 100644 index 000000000..05af5d7f2 --- /dev/null +++ b/src/base/str.test.cc @@ -0,0 +1,459 @@ +/* + * Copyright (c) 2019 The Regents of the University of California + * All rights reserved + * + * The license below extends only to copyright in the software and shall + * not be construed as granting a license to any other intellectual + * property including but not limited to intellectual property relating + * to a hardware implementation of the functionality of the software + * licensed hereunder. You may use the software subject to the license + * terms below provided that you ensure that this notice is replicated + * unmodified and in its entirety in all distributions of the software, + * modified or unmodified, in source code or in binary form. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions are + * met: redistributions of source code must retain the above copyright + * notice, this list of conditions and the following disclaimer; + * redistributions in binary form must reproduce the above copyright + * notice, this list of conditions and the following disclaimer in the + * documentation and/or other materials provided with the distribution; + * neither the name of the copyright holders nor the names of its + * contributors may be used to endorse or promote products derived from + * this software without specific prior written permission. + * + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS + * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT + * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR + * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT + * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, + * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT + * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, + * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY + * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT + * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE + * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + * + * Authors: Bobby R. Bruce + */ + +#include <gtest/gtest.h> + +#include "base/str.hh" + +/* + * str.cc has "eat_lead_white", "eat_end_white", and "eat_white" fucntions to + * remove leading and trailing whitespace. The following tests verify this + * behavior. + */ +TEST(StrTest, EatLeadWhite) +{ + std::string val = " hello there "; + eat_lead_white(val); + EXPECT_EQ("hello there ", val); +} + +TEST(StrTest, EatLeadWhiteNoLeadingWhitespace) +{ + std::string val = "hello there "; + eat_lead_white(val); + EXPECT_EQ("hello there ", val); +} + +TEST(StrTest, EatEndWhite) +{ + std::string val = " hello there "; + eat_end_white(val); + EXPECT_EQ(" hello there", val); +} + +TEST(StrTest, EatEndWhiteNoTrailingWhitespace) +{ + std::string val = " hello there"; + eat_end_white(val); + EXPECT_EQ(" hello there", val); +} + +TEST(StrTest, EatWhite) +{ + std::string val = " hello there "; + eat_white(val); + EXPECT_EQ("hello there", val); +} + +TEST(StrTest, EatWhiteNoWhitespace) +{ + std::string val = "hello there"; + eat_lead_white(val); + EXPECT_EQ("hello there", val); +} + +/* + * This tests checks that str.cc's "to_lower" function converts a string to + * lowercase. + */ +TEST(StrTest, ToLower) +{ + std::string val = "gOoDbYe FOO@barr!"; + to_lower("goodbye foo@bar!"); +} + +/* + * str.cc's "split_first" and "split_last" fucntions split a string on a + * character into two parts. "split_first" splits on the first instance of + * this character and "split_last" splits on the last instance of this + * character. The character itself is not included in either of the output + * right-hand side and left-hand side strings. If the character cannot be + * found in the string then the left-hand side string is equal to the input + * string and the right-hand side string is empty. + */ +TEST(StrTest, SplitFirst) +{ + std::string val = "abcdefg abcdefg"; + std::string lhs; + std::string rhs; + + split_first(val , lhs, rhs, 'f'); + EXPECT_EQ("abcdefg abcdefg", val); + EXPECT_EQ("abcde", lhs); + EXPECT_EQ("g abcdefg", rhs); +} + +TEST(StrTest, SplitFirstNoChar) +{ + std::string val = "abcdefg abcdefg"; + std::string lhs; + std::string rhs; + + split_first(val , lhs, rhs, 'h'); + EXPECT_EQ("abcdefg abcdefg", val); + EXPECT_EQ("abcdefg abcdefg", lhs); + EXPECT_EQ("", rhs); +} + +TEST(StrTest, SplitFirstOnFirstChar) +{ + std::string val = "abcdefg abcdefg"; + std::string lhs; + std::string rhs; + + split_first(val , lhs, rhs, 'a'); + EXPECT_EQ("abcdefg abcdefg", val); + EXPECT_EQ("", lhs); + EXPECT_EQ("bcdefg abcdefg", rhs); +} + +TEST(StrTest, SplitLast) +{ + std::string val = "abcdefg abcdefg"; + std::string lhs; + std::string rhs; + + split_last(val , lhs, rhs, 'f'); + EXPECT_EQ("abcdefg abcdefg", val); + EXPECT_EQ("abcdefg abcde", lhs); + EXPECT_EQ("g", rhs); +} + +TEST(StrTest, SplitLastNoChar) +{ + std::string val = "abcdefg abcdefg"; + std::string lhs; + std::string rhs; + + split_last(val , lhs, rhs, 'h'); + EXPECT_EQ("abcdefg abcdefg", val); + EXPECT_EQ("abcdefg abcdefg", lhs); + EXPECT_EQ("", rhs); +} + +TEST(StrTest, SplitLastOnLastChar) +{ + std::string val = "abcdefg abcdefg"; + std::string lhs; + std::string rhs; + + split_last(val , lhs, rhs, 'g'); + EXPECT_EQ("abcdefg abcdefg", val); + EXPECT_EQ("abcdefg abcdef", lhs); + EXPECT_EQ("", rhs); +} + + +/* + * str.cc's "tokenize" function splits a string into its constituent tokens. + * It splits based on an input character. + */ +TEST(StrTest, TokenizeOnSpace) +{ + /* + * val has a double space between each token with trailing and leading + * whitespace. + */ + std::string val = " Hello, this is a sentence. "; + std::vector<std::string> tokens; + + /* + * By default 'ign' is true. This means empty tokens are not included in + * the output list. + */ + tokenize(tokens, val, ' '); + EXPECT_EQ(" Hello, this is a sentence. ", val); + EXPECT_EQ(5, tokens.size()); + EXPECT_EQ("Hello,", tokens[0]); + EXPECT_EQ("this", tokens[1]); + EXPECT_EQ("is", tokens[2]); + EXPECT_EQ("a", tokens[3]); + EXPECT_EQ("sentence.", tokens[4]); +} + +TEST(StrTest, TokenizeOnSpaceIgnFalse) +{ + /* + * val has a double space between each token with trailing and leading + * whitespace. + */ + std::string val = " Hello, this is a sentence. "; + std::vector<std::string> tokens; + + tokenize(tokens, val, ' ', false); + EXPECT_EQ(" Hello, this is a sentence. ", val); + EXPECT_EQ(11, tokens.size()); + EXPECT_EQ("", tokens[0]); + EXPECT_EQ("Hello,", tokens[1]); + EXPECT_EQ("", tokens[2]); + EXPECT_EQ("this", tokens[3]); + EXPECT_EQ("", tokens[4]); + EXPECT_EQ("is", tokens[5]); + EXPECT_EQ("", tokens[6]); + EXPECT_EQ("a", tokens[7]); + EXPECT_EQ("", tokens[8]); + EXPECT_EQ("sentence.", tokens[9]); + EXPECT_EQ("", tokens[10]); +} + +TEST(StrTest, TokenizedTokenDoesNotExist) +{ + std::string val = "abcdefg"; + std::vector<std::string> tokens; + + tokenize(tokens, val, 'h'); + EXPECT_EQ("abcdefg", val); + EXPECT_EQ(1, tokens.size()); + EXPECT_EQ("abcdefg", tokens[0]); +} + +/* + * str.cc's "to_number" function converts a string to a number. The function + * will return false if this is not possible either because the string + * represents a number out-of-range, or because the string cannot be parsed. + */ +TEST(StrTest, ToNumber8BitInt) +{ + int8_t output; + std::string input = "-128"; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(-128, output); +} + +TEST(StrTest, ToNumber8BitIntStringOutOfRange) +{ + int8_t output; + std::string input = "-129"; + EXPECT_FALSE(to_number(input, output)); +} + +TEST(StrTest, ToNumber8BitIntInvalidString) +{ + int8_t output; + std::string input = "onetwoeight"; + EXPECT_FALSE(to_number(input, output)); +} + +TEST(StrTest, ToNumberUnsigned8BitInt) +{ + uint8_t output; + std::string input = "255"; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(255, output); +} + +TEST(StrTest, ToNumberUnsigned8BitIntNegative) +{ + uint8_t output; + std::string input = "-1"; + EXPECT_FALSE(to_number(input, output)); +} + +TEST(StrTest, ToNumber64BitInt) +{ + int64_t output; + int64_t input_number = 0xFFFFFFFFFFFFFFFF; + std::string input = std::to_string(input_number); + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(input_number, output); +} + +TEST(StrTest, ToNumber64BitIntInvalidString) +{ + int64_t output; + std::string input = " "; + EXPECT_FALSE(to_number(input, output)); +} + +TEST(StrTest, ToNumberFloat) +{ + float output; + std::string input = "0.1"; + float expected_output = 0.1; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(expected_output, output); +} + +TEST(StrTest, ToNumberFloatIntegerString) +{ + float output; + std::string input = "10"; + float expected_output = 10.0; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(expected_output, output); +} + +TEST(StrTest, ToNumberFloatNegative) +{ + float output; + std::string input = "-0.1"; + float expected_output = -0.1; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(expected_output, output); +} + +TEST(StrTest, ToNumberDouble) +{ + double output; + std::string input = "0.0001"; + double expected_output = 0.0001; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(expected_output, output); +} + +TEST(StrTest, ToNumberDoubleIntegerString) +{ + double output; + std::string input = "12345"; + double expected_output = 12345.0; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(expected_output, output); +} + +TEST(StrTest, ToNumberDoubleNegative) +{ + double output; + std::string input = "-1.2345"; + double expected_output = -1.2345; + EXPECT_TRUE(to_number(input, output)); + EXPECT_EQ(expected_output, output); +} + +/* + * The "to_bool" function takes a string, "true" or "false" + * (case-insenstive), and sets the second argument to the bool equivilent. + * The function will return false if it cannot parse the string. + */ +TEST(StrTest, ToBoolTrue) +{ + bool output = false; + EXPECT_TRUE(to_bool("TrUe", output)); + EXPECT_TRUE(output); +} + +TEST(StrTest, ToBoolFalse){ + bool output = true; + EXPECT_TRUE(to_bool("fAlSe", output)); + EXPECT_FALSE(output); +} + +TEST(StrTest, ToBoolInvalidInput) +{ + bool output; + EXPECT_FALSE(to_bool("falsify", output)); +} + +/* + * The "quote" function take a string and returns that string quoted (i.e., + * between double-quotes) if the string contains a space. + */ +TEST(StrTest, QuoteStringNoSpace) +{ + EXPECT_EQ("hello", quote("hello")); +} + +TEST(StrTest, QuoteStringWithSpace) +{ + EXPECT_EQ("\"hello world\"", quote("hello world")); +} + +TEST(StrTest, QuoteQuotedString) +{ + /* + * At present, a quoted string can be quoted again. + */ + EXPECT_EQ("\"\"hello world\"\"", quote("\"hello world\"")); +} + +TEST(StrTest, QuoteStringWithTab) +{ + /* + * The "quote" function only works with standard space, not any + * whitepsace. + */ + EXPECT_EQ("hello\tworld", quote("hello\tworld")); +} + +/* + * str.hh has three implementations of "startswith"; a function that takes + * string and a prefix and returns true if the string starts with the prefix. + * One implementation takes two strings, another takes two char*, and the + * third takes a string and a char* as a prefix. + */ +TEST(StrTest, StartswithDoubleStringDoesStartWith) +{ + std::string s = "Hello, how are you?"; + std::string prefix = "Hello"; + EXPECT_TRUE(startswith(s, prefix)); +} + +TEST(StrTest, StartswithDoubleStringDoesNotStartWith) +{ + std::string s = "Hello, how are you?"; + std::string prefix = "ello"; + EXPECT_FALSE(startswith(s, prefix)); +} + +TEST(StrTest, StartswithDoubleCharArrayDoesStartWith) +{ + const char* s = "abcdefg"; + const char* prefix = "ab"; + EXPECT_TRUE(startswith(s, prefix)); +} + +TEST(StrTest, StartswithDoubleCharArrayDoesNotStartWith) +{ + const char* s = " abcdefg"; + const char* prefix = "a"; + EXPECT_FALSE(startswith(s, prefix)); +} + +TEST(StrTest, StartswithStringCharArrayDoesStartWith) +{ + std::string s = "foobarr"; + const char* prefix = "f"; + EXPECT_TRUE(startswith(s, prefix)); +} + +TEST(StrTest, StartswithStringCharArrayDoesNotStartWith) +{ + std::string s = "foobarr"; + const char* prefix = "barr"; + EXPECT_FALSE(startswith(s, prefix)); +}
\ No newline at end of file |