2018-03-06 17:41:18 +00:00
|
|
|
|
#include <gtest/gtest.h>
|
|
|
|
|
|
|
|
|
|
#include <base/system.h>
|
|
|
|
|
|
|
|
|
|
TEST(Str, Dist)
|
|
|
|
|
{
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("aaa", "aaa"), 0);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("123", "123"), 0);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("", ""), 0);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("a", "b"), 1);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("", "aaa"), 3);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("123", ""), 3);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("ä", ""), 1);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("Hëllö", "Hello"), 2);
|
|
|
|
|
// https://en.wikipedia.org/w/index.php?title=Levenshtein_distance&oldid=828480025#Example
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("kitten", "sitting"), 3);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("flaw", "lawn"), 2);
|
|
|
|
|
EXPECT_EQ(str_utf8_dist("saturday", "sunday"), 3);
|
|
|
|
|
}
|
2018-03-14 01:27:15 +00:00
|
|
|
|
|
|
|
|
|
TEST(Str, Utf8Isspace)
|
|
|
|
|
{
|
2018-03-14 02:04:41 +00:00
|
|
|
|
EXPECT_TRUE(str_utf8_isspace(0x200b)); // Zero-width space
|
2018-03-14 01:27:15 +00:00
|
|
|
|
EXPECT_TRUE(str_utf8_isspace(' '));
|
|
|
|
|
EXPECT_FALSE(str_utf8_isspace('a'));
|
2018-03-14 02:04:41 +00:00
|
|
|
|
// Control characters.
|
|
|
|
|
for(char c = 0; c < 0x20; c++)
|
|
|
|
|
{
|
|
|
|
|
EXPECT_TRUE(str_utf8_isspace(c));
|
|
|
|
|
}
|
2018-03-14 01:27:15 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
TEST(Str, Utf8SkipWhitespaces)
|
|
|
|
|
{
|
|
|
|
|
EXPECT_STREQ(str_utf8_skip_whitespaces("abc"), "abc");
|
|
|
|
|
EXPECT_STREQ(str_utf8_skip_whitespaces("abc "), "abc ");
|
|
|
|
|
EXPECT_STREQ(str_utf8_skip_whitespaces(" abc"), "abc");
|
2018-03-14 02:04:41 +00:00
|
|
|
|
EXPECT_STREQ(str_utf8_skip_whitespaces("\xe2\x80\x8b abc"), "abc");
|
2018-03-14 01:27:15 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
TEST(Str, Utf8TrimRight)
|
|
|
|
|
{
|
|
|
|
|
char A1[] = "abc"; str_utf8_trim_right(A1); EXPECT_STREQ(A1, "abc");
|
|
|
|
|
char A2[] = " abc"; str_utf8_trim_right(A2); EXPECT_STREQ(A2, " abc");
|
|
|
|
|
char A3[] = "abc "; str_utf8_trim_right(A3); EXPECT_STREQ(A3, "abc");
|
2018-03-14 02:04:41 +00:00
|
|
|
|
char A4[] = "abc \xe2\x80\x8b"; str_utf8_trim_right(A4); EXPECT_STREQ(A4, "abc");
|
2018-03-14 01:27:15 +00:00
|
|
|
|
}
|
2018-03-20 20:11:44 +00:00
|
|
|
|
|
|
|
|
|
TEST(Str, Utf8CompConfusables)
|
|
|
|
|
{
|
|
|
|
|
EXPECT_TRUE(str_utf8_comp_confusable("abc", "abc") == 0);
|
|
|
|
|
EXPECT_TRUE(str_utf8_comp_confusable("rn", "m") == 0);
|
|
|
|
|
EXPECT_TRUE(str_utf8_comp_confusable("l", "ӏ") == 0); // CYRILLIC SMALL LETTER PALOCHKA
|
|
|
|
|
EXPECT_FALSE(str_utf8_comp_confusable("o", "x") == 0);
|
|
|
|
|
EXPECT_TRUE(str_utf8_comp_confusable("aceiou", "ąçęįǫų") == 0);
|
|
|
|
|
}
|
2018-07-25 08:23:07 +00:00
|
|
|
|
|
|
|
|
|
TEST(Str, Startswith)
|
|
|
|
|
{
|
|
|
|
|
EXPECT_TRUE(str_startswith("abcdef", "abc"));
|
|
|
|
|
EXPECT_FALSE(str_startswith("abc", "abcdef"));
|
|
|
|
|
|
|
|
|
|
EXPECT_TRUE(str_startswith("xyz", ""));
|
|
|
|
|
EXPECT_FALSE(str_startswith("", "xyz"));
|
|
|
|
|
|
|
|
|
|
EXPECT_FALSE(str_startswith("house", "home"));
|
|
|
|
|
EXPECT_FALSE(str_startswith("blackboard", "board"));
|
|
|
|
|
|
|
|
|
|
EXPECT_TRUE(str_startswith("поплавать", "по"));
|
|
|
|
|
EXPECT_FALSE(str_startswith("плавать", "по"));
|
|
|
|
|
|
|
|
|
|
static const char ABCDEF[] = "abcdef";
|
|
|
|
|
static const char ABC[] = "abc";
|
|
|
|
|
EXPECT_EQ(str_startswith(ABCDEF, ABC) - ABCDEF, str_length(ABC));
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
TEST(Str, Endswith)
|
|
|
|
|
{
|
|
|
|
|
EXPECT_TRUE(str_endswith("abcdef", "def"));
|
|
|
|
|
EXPECT_FALSE(str_endswith("def", "abcdef"));
|
|
|
|
|
|
|
|
|
|
EXPECT_TRUE(str_endswith("xyz", ""));
|
|
|
|
|
EXPECT_FALSE(str_endswith("", "xyz"));
|
|
|
|
|
|
|
|
|
|
EXPECT_FALSE(str_endswith("rhyme", "mine"));
|
|
|
|
|
EXPECT_FALSE(str_endswith("blackboard", "black"));
|
|
|
|
|
|
|
|
|
|
EXPECT_TRUE(str_endswith("люди", "юди"));
|
|
|
|
|
EXPECT_FALSE(str_endswith("люди", "любовь"));
|
|
|
|
|
}
|