361 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			361 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| // Copyright 2017 The Abseil Authors.
 | |
| //
 | |
| // Licensed under the Apache License, Version 2.0 (the "License");
 | |
| // you may not use this file except in compliance with the License.
 | |
| // You may obtain a copy of the License at
 | |
| //
 | |
| //      https://www.apache.org/licenses/LICENSE-2.0
 | |
| //
 | |
| // Unless required by applicable law or agreed to in writing, software
 | |
| // distributed under the License is distributed on an "AS IS" BASIS,
 | |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
| // See the License for the specific language governing permissions and
 | |
| // limitations under the License.
 | |
| 
 | |
| #include "absl/strings/ascii.h"
 | |
| 
 | |
| #include <cctype>
 | |
| #include <clocale>
 | |
| #include <cstring>
 | |
| #include <string>
 | |
| 
 | |
| #include "gtest/gtest.h"
 | |
| #include "absl/base/macros.h"
 | |
| #include "absl/base/port.h"
 | |
| 
 | |
| namespace {
 | |
| 
 | |
| TEST(AsciiIsFoo, All) {
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if ((i >= 'a' && i <= 'z') || (i >= 'A' && i <= 'Z'))
 | |
|       EXPECT_TRUE(absl::ascii_isalpha(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isalpha(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if ((i >= '0' && i <= '9'))
 | |
|       EXPECT_TRUE(absl::ascii_isdigit(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isdigit(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (absl::ascii_isalpha(i) || absl::ascii_isdigit(i))
 | |
|       EXPECT_TRUE(absl::ascii_isalnum(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isalnum(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (i != '\0' && strchr(" \r\n\t\v\f", i))
 | |
|       EXPECT_TRUE(absl::ascii_isspace(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isspace(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (i >= 32 && i < 127)
 | |
|       EXPECT_TRUE(absl::ascii_isprint(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isprint(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (absl::ascii_isprint(i) && !absl::ascii_isspace(i) &&
 | |
|         !absl::ascii_isalnum(i))
 | |
|       EXPECT_TRUE(absl::ascii_ispunct(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_ispunct(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (i == ' ' || i == '\t')
 | |
|       EXPECT_TRUE(absl::ascii_isblank(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isblank(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (i < 32 || i == 127)
 | |
|       EXPECT_TRUE(absl::ascii_iscntrl(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_iscntrl(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (absl::ascii_isdigit(i) || (i >= 'A' && i <= 'F') ||
 | |
|         (i >= 'a' && i <= 'f'))
 | |
|       EXPECT_TRUE(absl::ascii_isxdigit(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isxdigit(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (i > 32 && i < 127)
 | |
|       EXPECT_TRUE(absl::ascii_isgraph(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isgraph(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (i >= 'A' && i <= 'Z')
 | |
|       EXPECT_TRUE(absl::ascii_isupper(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_isupper(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (i >= 'a' && i <= 'z')
 | |
|       EXPECT_TRUE(absl::ascii_islower(i)) << ": failed on " << i;
 | |
|     else
 | |
|       EXPECT_TRUE(!absl::ascii_islower(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 0; i < 128; i++) {
 | |
|     EXPECT_TRUE(absl::ascii_isascii(i)) << ": failed on " << i;
 | |
|   }
 | |
|   for (int i = 128; i < 256; i++) {
 | |
|     EXPECT_TRUE(!absl::ascii_isascii(i)) << ": failed on " << i;
 | |
|   }
 | |
| 
 | |
|   // The official is* functions don't accept negative signed chars, but
 | |
|   // our absl::ascii_is* functions do.
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     signed char sc = static_cast<signed char>(static_cast<unsigned char>(i));
 | |
|     EXPECT_EQ(absl::ascii_isalpha(i), absl::ascii_isalpha(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isdigit(i), absl::ascii_isdigit(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isalnum(i), absl::ascii_isalnum(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isspace(i), absl::ascii_isspace(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_ispunct(i), absl::ascii_ispunct(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isblank(i), absl::ascii_isblank(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_iscntrl(i), absl::ascii_iscntrl(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isxdigit(i), absl::ascii_isxdigit(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isprint(i), absl::ascii_isprint(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isgraph(i), absl::ascii_isgraph(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isupper(i), absl::ascii_isupper(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_islower(i), absl::ascii_islower(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_isascii(i), absl::ascii_isascii(sc)) << i;
 | |
|   }
 | |
| }
 | |
| 
 | |
| // Checks that absl::ascii_isfoo returns the same value as isfoo in the C
 | |
| // locale.
 | |
| TEST(AsciiIsFoo, SameAsIsFoo) {
 | |
| #ifndef __ANDROID__
 | |
|   // temporarily change locale to C. It should already be C, but just for safety
 | |
|   const char* old_locale = setlocale(LC_CTYPE, "C");
 | |
|   ASSERT_TRUE(old_locale != nullptr);
 | |
| #endif
 | |
| 
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     EXPECT_EQ(isalpha(i) != 0, absl::ascii_isalpha(i)) << i;
 | |
|     EXPECT_EQ(isdigit(i) != 0, absl::ascii_isdigit(i)) << i;
 | |
|     EXPECT_EQ(isalnum(i) != 0, absl::ascii_isalnum(i)) << i;
 | |
|     EXPECT_EQ(isspace(i) != 0, absl::ascii_isspace(i)) << i;
 | |
|     EXPECT_EQ(ispunct(i) != 0, absl::ascii_ispunct(i)) << i;
 | |
|     EXPECT_EQ(isblank(i) != 0, absl::ascii_isblank(i)) << i;
 | |
|     EXPECT_EQ(iscntrl(i) != 0, absl::ascii_iscntrl(i)) << i;
 | |
|     EXPECT_EQ(isxdigit(i) != 0, absl::ascii_isxdigit(i)) << i;
 | |
|     EXPECT_EQ(isprint(i) != 0, absl::ascii_isprint(i)) << i;
 | |
|     EXPECT_EQ(isgraph(i) != 0, absl::ascii_isgraph(i)) << i;
 | |
|     EXPECT_EQ(isupper(i) != 0, absl::ascii_isupper(i)) << i;
 | |
|     EXPECT_EQ(islower(i) != 0, absl::ascii_islower(i)) << i;
 | |
|     EXPECT_EQ(isascii(i) != 0, absl::ascii_isascii(i)) << i;
 | |
|   }
 | |
| 
 | |
| #ifndef __ANDROID__
 | |
|   // restore the old locale.
 | |
|   ASSERT_TRUE(setlocale(LC_CTYPE, old_locale));
 | |
| #endif
 | |
| }
 | |
| 
 | |
| TEST(AsciiToFoo, All) {
 | |
| #ifndef __ANDROID__
 | |
|   // temporarily change locale to C. It should already be C, but just for safety
 | |
|   const char* old_locale = setlocale(LC_CTYPE, "C");
 | |
|   ASSERT_TRUE(old_locale != nullptr);
 | |
| #endif
 | |
| 
 | |
|   for (int i = 0; i < 256; i++) {
 | |
|     if (absl::ascii_islower(i))
 | |
|       EXPECT_EQ(absl::ascii_toupper(i), 'A' + (i - 'a')) << i;
 | |
|     else
 | |
|       EXPECT_EQ(absl::ascii_toupper(i), static_cast<char>(i)) << i;
 | |
| 
 | |
|     if (absl::ascii_isupper(i))
 | |
|       EXPECT_EQ(absl::ascii_tolower(i), 'a' + (i - 'A')) << i;
 | |
|     else
 | |
|       EXPECT_EQ(absl::ascii_tolower(i), static_cast<char>(i)) << i;
 | |
| 
 | |
|     // These CHECKs only hold in a C locale.
 | |
|     EXPECT_EQ(static_cast<char>(tolower(i)), absl::ascii_tolower(i)) << i;
 | |
|     EXPECT_EQ(static_cast<char>(toupper(i)), absl::ascii_toupper(i)) << i;
 | |
| 
 | |
|     // The official to* functions don't accept negative signed chars, but
 | |
|     // our absl::ascii_to* functions do.
 | |
|     signed char sc = static_cast<signed char>(static_cast<unsigned char>(i));
 | |
|     EXPECT_EQ(absl::ascii_tolower(i), absl::ascii_tolower(sc)) << i;
 | |
|     EXPECT_EQ(absl::ascii_toupper(i), absl::ascii_toupper(sc)) << i;
 | |
|   }
 | |
| #ifndef __ANDROID__
 | |
|   // restore the old locale.
 | |
|   ASSERT_TRUE(setlocale(LC_CTYPE, old_locale));
 | |
| #endif
 | |
| }
 | |
| 
 | |
| TEST(AsciiStrTo, Lower) {
 | |
|   const char buf[] = "ABCDEF";
 | |
|   const std::string str("GHIJKL");
 | |
|   const std::string str2("MNOPQR");
 | |
|   const absl::string_view sp(str2);
 | |
| 
 | |
|   EXPECT_EQ("abcdef", absl::AsciiStrToLower(buf));
 | |
|   EXPECT_EQ("ghijkl", absl::AsciiStrToLower(str));
 | |
|   EXPECT_EQ("mnopqr", absl::AsciiStrToLower(sp));
 | |
| 
 | |
|   char mutable_buf[] = "Mutable";
 | |
|   std::transform(mutable_buf, mutable_buf + strlen(mutable_buf),
 | |
|                  mutable_buf, absl::ascii_tolower);
 | |
|   EXPECT_STREQ("mutable", mutable_buf);
 | |
| }
 | |
| 
 | |
| TEST(AsciiStrTo, Upper) {
 | |
|   const char buf[] = "abcdef";
 | |
|   const std::string str("ghijkl");
 | |
|   const std::string str2("mnopqr");
 | |
|   const absl::string_view sp(str2);
 | |
| 
 | |
|   EXPECT_EQ("ABCDEF", absl::AsciiStrToUpper(buf));
 | |
|   EXPECT_EQ("GHIJKL", absl::AsciiStrToUpper(str));
 | |
|   EXPECT_EQ("MNOPQR", absl::AsciiStrToUpper(sp));
 | |
| 
 | |
|   char mutable_buf[] = "Mutable";
 | |
|   std::transform(mutable_buf, mutable_buf + strlen(mutable_buf),
 | |
|                  mutable_buf, absl::ascii_toupper);
 | |
|   EXPECT_STREQ("MUTABLE", mutable_buf);
 | |
| }
 | |
| 
 | |
| TEST(StripLeadingAsciiWhitespace, FromStringView) {
 | |
|   EXPECT_EQ(absl::string_view{},
 | |
|             absl::StripLeadingAsciiWhitespace(absl::string_view{}));
 | |
|   EXPECT_EQ("foo", absl::StripLeadingAsciiWhitespace({"foo"}));
 | |
|   EXPECT_EQ("foo", absl::StripLeadingAsciiWhitespace({"\t  \n\f\r\n\vfoo"}));
 | |
|   EXPECT_EQ("foo foo\n ",
 | |
|             absl::StripLeadingAsciiWhitespace({"\t  \n\f\r\n\vfoo foo\n "}));
 | |
|   EXPECT_EQ(absl::string_view{}, absl::StripLeadingAsciiWhitespace(
 | |
|                                      {"\t  \n\f\r\v\n\t  \n\f\r\v\n"}));
 | |
| }
 | |
| 
 | |
| TEST(StripLeadingAsciiWhitespace, InPlace) {
 | |
|   std::string str;
 | |
| 
 | |
|   absl::StripLeadingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("", str);
 | |
| 
 | |
|   str = "foo";
 | |
|   absl::StripLeadingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo", str);
 | |
| 
 | |
|   str = "\t  \n\f\r\n\vfoo";
 | |
|   absl::StripLeadingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo", str);
 | |
| 
 | |
|   str = "\t  \n\f\r\n\vfoo foo\n ";
 | |
|   absl::StripLeadingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo foo\n ", str);
 | |
| 
 | |
|   str = "\t  \n\f\r\v\n\t  \n\f\r\v\n";
 | |
|   absl::StripLeadingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ(absl::string_view{}, str);
 | |
| }
 | |
| 
 | |
| TEST(StripTrailingAsciiWhitespace, FromStringView) {
 | |
|   EXPECT_EQ(absl::string_view{},
 | |
|             absl::StripTrailingAsciiWhitespace(absl::string_view{}));
 | |
|   EXPECT_EQ("foo", absl::StripTrailingAsciiWhitespace({"foo"}));
 | |
|   EXPECT_EQ("foo", absl::StripTrailingAsciiWhitespace({"foo\t  \n\f\r\n\v"}));
 | |
|   EXPECT_EQ(" \nfoo foo",
 | |
|             absl::StripTrailingAsciiWhitespace({" \nfoo foo\t  \n\f\r\n\v"}));
 | |
|   EXPECT_EQ(absl::string_view{}, absl::StripTrailingAsciiWhitespace(
 | |
|                                      {"\t  \n\f\r\v\n\t  \n\f\r\v\n"}));
 | |
| }
 | |
| 
 | |
| TEST(StripTrailingAsciiWhitespace, InPlace) {
 | |
|   std::string str;
 | |
| 
 | |
|   absl::StripTrailingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("", str);
 | |
| 
 | |
|   str = "foo";
 | |
|   absl::StripTrailingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo", str);
 | |
| 
 | |
|   str = "foo\t  \n\f\r\n\v";
 | |
|   absl::StripTrailingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo", str);
 | |
| 
 | |
|   str = " \nfoo foo\t  \n\f\r\n\v";
 | |
|   absl::StripTrailingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ(" \nfoo foo", str);
 | |
| 
 | |
|   str = "\t  \n\f\r\v\n\t  \n\f\r\v\n";
 | |
|   absl::StripTrailingAsciiWhitespace(&str);
 | |
|   EXPECT_EQ(absl::string_view{}, str);
 | |
| }
 | |
| 
 | |
| TEST(StripAsciiWhitespace, FromStringView) {
 | |
|   EXPECT_EQ(absl::string_view{},
 | |
|             absl::StripAsciiWhitespace(absl::string_view{}));
 | |
|   EXPECT_EQ("foo", absl::StripAsciiWhitespace({"foo"}));
 | |
|   EXPECT_EQ("foo",
 | |
|             absl::StripAsciiWhitespace({"\t  \n\f\r\n\vfoo\t  \n\f\r\n\v"}));
 | |
|   EXPECT_EQ("foo foo", absl::StripAsciiWhitespace(
 | |
|                            {"\t  \n\f\r\n\vfoo foo\t  \n\f\r\n\v"}));
 | |
|   EXPECT_EQ(absl::string_view{},
 | |
|             absl::StripAsciiWhitespace({"\t  \n\f\r\v\n\t  \n\f\r\v\n"}));
 | |
| }
 | |
| 
 | |
| TEST(StripAsciiWhitespace, InPlace) {
 | |
|   std::string str;
 | |
| 
 | |
|   absl::StripAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("", str);
 | |
| 
 | |
|   str = "foo";
 | |
|   absl::StripAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo", str);
 | |
| 
 | |
|   str = "\t  \n\f\r\n\vfoo\t  \n\f\r\n\v";
 | |
|   absl::StripAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo", str);
 | |
| 
 | |
|   str = "\t  \n\f\r\n\vfoo foo\t  \n\f\r\n\v";
 | |
|   absl::StripAsciiWhitespace(&str);
 | |
|   EXPECT_EQ("foo foo", str);
 | |
| 
 | |
|   str = "\t  \n\f\r\v\n\t  \n\f\r\v\n";
 | |
|   absl::StripAsciiWhitespace(&str);
 | |
|   EXPECT_EQ(absl::string_view{}, str);
 | |
| }
 | |
| 
 | |
| TEST(RemoveExtraAsciiWhitespace, InPlace) {
 | |
|   const char* inputs[] = {"No extra space",
 | |
|                           "  Leading whitespace",
 | |
|                           "Trailing whitespace  ",
 | |
|                           "  Leading and trailing  ",
 | |
|                           " Whitespace \t  in\v   middle  ",
 | |
|                           "'Eeeeep!  \n Newlines!\n",
 | |
|                           "nospaces",
 | |
|                           "",
 | |
|                           "\n\t a\t\n\nb \t\n"};
 | |
| 
 | |
|   const char* outputs[] = {
 | |
|       "No extra space",
 | |
|       "Leading whitespace",
 | |
|       "Trailing whitespace",
 | |
|       "Leading and trailing",
 | |
|       "Whitespace in middle",
 | |
|       "'Eeeeep! Newlines!",
 | |
|       "nospaces",
 | |
|       "",
 | |
|       "a\nb",
 | |
|   };
 | |
|   const int NUM_TESTS = ABSL_ARRAYSIZE(inputs);
 | |
| 
 | |
|   for (int i = 0; i < NUM_TESTS; i++) {
 | |
|     std::string s(inputs[i]);
 | |
|     absl::RemoveExtraAsciiWhitespace(&s);
 | |
|     EXPECT_EQ(outputs[i], s);
 | |
|   }
 | |
| }
 | |
| 
 | |
| }  // namespace
 |