mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-01-31 19:43:32 +00:00
7c83f4abc8
- wcsstr() is now linearly complex - strstr16() is now linearly complex - strstr() is now vectorized on aarch64 (10x) - strstr() now uses KMP on pathological cases - memmem() is now vectorized on aarch64 (10x) - memmem() now uses KMP on pathological cases - Disable shared_ptr::owner_before until fixed - Make iswlower(), iswupper() consistent with glibc - Remove figure space from iswspace() implementation - Include line and paragraph separator in iswcntrl() - Use Musl wcwidth(), iswalpha(), iswpunct(), towlower(), towupper()
88 lines
5.7 KiB
C
88 lines
5.7 KiB
C
/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
│ vi: set et ft=c ts=2 sts=2 sw=2 fenc=utf-8                               :vi │
╞══════════════════════════════════════════════════════════════════════════════╡
│ Copyright 2020 Justine Alexandra Roberts Tunney                              │
│                                                                              │
│ Permission to use, copy, modify, and/or distribute this software for         │
│ any purpose with or without fee is hereby granted, provided that the         │
│ above copyright notice and this permission notice appear in all copies.      │
│                                                                              │
│ THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL                │
│ WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED                │
│ WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE             │
│ AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL         │
│ DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR        │
│ PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER               │
│ TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR             │
│ PERFORMANCE OF THIS SOFTWARE.                                                │
╚─────────────────────────────────────────────────────────────────────────────*/
|
|
#include "libc/stdio/stdio.h"
|
|
#include "libc/str/str.h"
|
|
#include "libc/str/strwidth.h"
|
|
#include "libc/str/unicode.h"
|
|
#include "libc/testlib/benchmark.h"
|
|
#include "libc/testlib/ezbench.h"
|
|
#include "libc/testlib/testlib.h"
|
|
|
|
TEST(wcwidth, test) {
|
|
ASSERT_EQ(0, wcwidth(0));
|
|
ASSERT_EQ(-1, wcwidth(1));
|
|
ASSERT_EQ(-1, wcwidth(-7));
|
|
ASSERT_EQ(1, wcwidth(0x10FFFD));
|
|
ASSERT_EQ(-1, wcwidth(0x10FFFD + 1));
|
|
ASSERT_EQ(2, wcwidth(L'😀'));
|
|
}
|
|
|
|
TEST(strwidth, testCjkWidesAndCombiningLowLines_withThompsonPikeEncoding) {
|
|
/*───────────────────────────────────────────────────┬─*/
|
|
EXPECT_EQ(20, strwidth(/**/ "𐌰𐌱𐌲𐌳𐌴𐌵𐌶𐌷▒▒▒▒▒▒▒▒▒▒▒▒" /*│*/, 0));
|
|
EXPECT_EQ(20, strwidth(/**/ "(╯°□°)╯𐄻︵ ̲┻̲━̲┻▒▒▒▒▒▒" /*│*/, 0));
|
|
EXPECT_EQ(20, strwidth(/**/ "ちゃぶ台返し▒▒▒▒▒▒▒▒" /*│*/, 0));
|
|
EXPECT_EQ(68, strlen(/*──*/ "𐌰𐌱𐌲𐌳𐌴𐌵𐌶𐌷▒▒▒▒▒▒▒▒▒▒▒▒" /*│*/));
|
|
EXPECT_EQ(56, strlen(/*──*/ "(╯°□°)╯𐄻︵ ̲┻̲━̲┻▒▒▒▒▒▒" /*│*/));
|
|
EXPECT_EQ(42, strlen(/*──*/ "ちゃぶ台返し▒▒▒▒▒▒▒▒" /*│*/));
|
|
/*───────────────────────────────────────────────────┴─*/
|
|
}
|
|
|
|
TEST(strwidth16, testCjkWidesAndCombiningLowLines_lengthIsNotShorts) {
|
|
/*──────────────────────────────────────────────────────┬─*/
|
|
EXPECT_EQ(20, strwidth16(/**/ u"𐌰𐌱𐌲𐌳𐌴𐌵𐌶𐌷▒▒▒▒▒▒▒▒▒▒▒▒" /*│*/, 0));
|
|
EXPECT_EQ(20, strwidth16(/**/ u"(╯°□°)╯𐄻︵ ̲┻̲━̲┻▒▒▒▒▒▒" /*│*/, 0));
|
|
EXPECT_EQ(20, strwidth16(/**/ u"ちゃぶ台返し▒▒▒▒▒▒▒▒" /*│*/, 0));
|
|
EXPECT_EQ(28, strlen16(/*──*/ u"𐌰𐌱𐌲𐌳𐌴𐌵𐌶𐌷▒▒▒▒▒▒▒▒▒▒▒▒" /*│*/));
|
|
EXPECT_EQ(23, strlen16(/*──*/ u"(╯°□°)╯𐄻︵ ̲┻̲━̲┻▒▒▒▒▒▒" /*│*/));
|
|
EXPECT_EQ(14, strlen16(/*──*/ u"ちゃぶ台返し▒▒▒▒▒▒▒▒" /*│*/));
|
|
/*──────────────────────────────────────────────────────┴─*/
|
|
}
|
|
|
|
// Checks that wcswidth() reports display columns rather than the
// number of wide characters.
//
// Each of the three L"" strings is expected to measure 20 columns,
// while wcslen() on the same literals reports 20, 22, and 14.
// The ruler comments and the /**/ and /*│*/ markers only exist so the
// literals line up visually in a monospace editor.
//
// NOTE(review): wcswidth() is called with 0 as its second argument and
// still expected to return 20, so that argument is presumably a
// starting column offset rather than a character limit -- confirm
// against libc/str/strwidth.h.
TEST(wcwidth, testCjkWidesAndCombiningLowLines_widthIsNotLength) {
  /*────────────────────────────────────────────────────┬─*/
  EXPECT_EQ(20, wcswidth(/**/ L"Table flip▒▒▒▒▒▒▒▒▒▒" /*│*/, 0));
  EXPECT_EQ(20, wcswidth(/**/ L"(╯°□°)╯︵ ̲┻̲━̲┻▒▒▒▒▒▒▒" /*│*/, 0));
  EXPECT_EQ(20, wcswidth(/**/ L"ちゃぶ台返し▒▒▒▒▒▒▒▒" /*│*/, 0));
  EXPECT_EQ(20, wcslen(/*──*/ L"Table flip▒▒▒▒▒▒▒▒▒▒" /*│*/));
  EXPECT_EQ(22, wcslen(/*──*/ L"(╯°□°)╯︵ ̲┻̲━̲┻▒▒▒▒▒▒▒" /*│*/));
  EXPECT_EQ(14, wcslen(/*──*/ L"ちゃぶ台返し▒▒▒▒▒▒▒▒" /*│*/));
  /*────────────────────────────────────────────────────┴─*/
}
|
|
|
|
TEST(wcwidth, block) {
|
|
EXPECT_EQ(1, wcwidth(u'▄'));
|
|
EXPECT_EQ(0x3061, L'ち');
|
|
EXPECT_EQ(2, wcwidth(L'ち'));
|
|
}
|
|
|
|
TEST(strwidth, testTextDelimitingControlCodes_dontHaveSubstance) {
|
|
EXPECT_EQ(0, strwidth("\0", 0));
|
|
EXPECT_EQ(0, strwidth("\1", 0));
|
|
}
|
|
|
|
// Benchmark helper that calls wcwidth() on `c`.
// NOTE(review): __veil and __expropriate are project macros not shown
// in this file; presumably they stop the optimizer from constant-folding
// the argument and from discarding the result -- confirm.
#define WCWIDTH(c) \
  __expropriate(wcwidth(__veil("r", c)))
|
|
|
|
// Times wcwidth() through the WCWIDTH() wrapper on an ASCII letter, an
// arrow symbol, an emoji, and NUL.
//
// NOTE(review): the 'a' case is benchmarked twice in a row; presumably
// the first run serves as a warm-up -- confirm before removing it.
BENCH(wcwidth, bench) {
  BENCHMARK(1000, 1, WCWIDTH(u'a'));
  BENCHMARK(1000, 1, WCWIDTH(u'a'));
  BENCHMARK(1000, 1, WCWIDTH(u'→'));
  BENCHMARK(1000, 1, WCWIDTH(L'😀'));
  BENCHMARK(1000, 1, WCWIDTH(0));
}
|