mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-07-25 12:00:31 +00:00
Do some string library work
This commit is contained in:
parent
83d41e4588
commit
35203c0551
42 changed files with 1381 additions and 136 deletions
|
@ -41,7 +41,7 @@ static const int16_t kDel16[8] = {127, 127, 127, 127, 127, 127, 127, 127};
|
|||
* @param n if -1 implies strlen
|
||||
* @param z if non-NULL receives output length
|
||||
*/
|
||||
char *utf16toutf8(const char16_t *p, size_t n, size_t *z) {
|
||||
char *utf16to8(const char16_t *p, size_t n, size_t *z) {
|
||||
char *r, *q;
|
||||
wint_t x, y;
|
||||
unsigned m, j, w;
|
51
libc/x/utf32to8.c
Normal file
51
libc/x/utf32to8.c
Normal file
|
@ -0,0 +1,51 @@
|
|||
/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
|
||||
│vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│
|
||||
╞══════════════════════════════════════════════════════════════════════════════╡
|
||||
│ Copyright 2022 Justine Alexandra Roberts Tunney │
|
||||
│ │
|
||||
│ Permission to use, copy, modify, and/or distribute this software for │
|
||||
│ any purpose with or without fee is hereby granted, provided that the │
|
||||
│ above copyright notice and this permission notice appear in all copies. │
|
||||
│ │
|
||||
│ THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL │
|
||||
│ WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED │
|
||||
│ WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE │
|
||||
│ AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL │
|
||||
│ DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR │
|
||||
│ PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER │
|
||||
│ TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR │
|
||||
│ PERFORMANCE OF THIS SOFTWARE. │
|
||||
╚─────────────────────────────────────────────────────────────────────────────*/
|
||||
#include "libc/mem/mem.h"
|
||||
#include "libc/str/str.h"
|
||||
#include "libc/str/tpenc.h"
|
||||
#include "libc/x/x.h"
|
||||
|
||||
/**
|
||||
* Transcodes UTF-32 to UTF-8.
|
||||
*
|
||||
* @param p is input value
|
||||
* @param n if -1 implies wcslen
|
||||
* @param z if non-NULL receives output length
|
||||
*/
|
||||
char *utf32to8(const wchar_t *p, size_t n, size_t *z) {
|
||||
size_t i;
|
||||
wint_t x;
|
||||
uint64_t w;
|
||||
char *r, *q;
|
||||
if (z) *z = 0;
|
||||
if (n == -1) n = p ? wcslen(p) : 0;
|
||||
if ((q = r = malloc(n * 6 + 1))) {
|
||||
for (i = 0; i < n; ++i) {
|
||||
x = p[i];
|
||||
w = tpenc(x);
|
||||
do {
|
||||
*q++ = w;
|
||||
} while ((w >>= 8));
|
||||
}
|
||||
if (z) *z = q - r;
|
||||
*q++ = '\0';
|
||||
if ((q = realloc(r, q - r))) r = q;
|
||||
}
|
||||
return r;
|
||||
}
|
|
@ -29,7 +29,7 @@
|
|||
* @param n if -1 implies strlen
|
||||
* @param z if non-NULL receives output length
|
||||
*/
|
||||
char16_t *utf8toutf16(const char *p, size_t n, size_t *z) {
|
||||
char16_t *utf8to16(const char *p, size_t n, size_t *z) {
|
||||
size_t i;
|
||||
wint_t x, a, b;
|
||||
char16_t *r, *q;
|
|
@ -16,6 +16,7 @@
|
|||
│ TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR │
|
||||
│ PERFORMANCE OF THIS SOFTWARE. │
|
||||
╚─────────────────────────────────────────────────────────────────────────────*/
|
||||
#include "libc/intrin/likely.h"
|
||||
#include "libc/intrin/pcmpgtb.h"
|
||||
#include "libc/intrin/pmovmskb.h"
|
||||
#include "libc/intrin/punpckhbw.h"
|
||||
|
@ -35,7 +36,8 @@
|
|||
* @param n if -1 implies strlen
|
||||
* @param z if non-NULL receives output length
|
||||
*/
|
||||
wchar_t *utf8toutf32(const char *p, size_t n, size_t *z) {
|
||||
wchar_t *utf8to32(const char *p, size_t n, size_t *z) {
|
||||
int e;
|
||||
size_t i;
|
||||
unsigned m, j;
|
||||
wint_t x, a, b;
|
||||
|
@ -45,7 +47,8 @@ wchar_t *utf8toutf32(const char *p, size_t n, size_t *z) {
|
|||
if (n == -1) n = p ? strlen(p) : 0;
|
||||
if ((q = r = malloc(n * sizeof(wchar_t) + sizeof(wchar_t)))) {
|
||||
for (i = 0; i < n;) {
|
||||
if (i + 16 < n) { /* 10x speedup for ascii */
|
||||
if (!((uintptr_t)(p + i) & 15) && i + 16 < n) {
|
||||
/* 10x speedup for ascii */
|
||||
bzero(vz, 16);
|
||||
do {
|
||||
memcpy(v1, p + i, 16);
|
|
@ -52,10 +52,11 @@ char *xstrmul(const char *, size_t) paramsnonnull((1)) _XMAL;
|
|||
char *xinet_ntop(int, const void *) _XPNN _XMAL;
|
||||
void *xunbinga(size_t, const char16_t *) attributeallocalign((1)) _XMAL _XRET;
|
||||
void *xunbing(const char16_t *) _XMAL _XRET;
|
||||
char16_t *utf8toutf16(const char *, size_t, size_t *) dontdiscard;
|
||||
char *utf16toutf8(const char16_t *, size_t, size_t *) dontdiscard;
|
||||
wchar_t *utf8toutf32(const char *, size_t, size_t *) dontdiscard;
|
||||
char16_t *utf8to16(const char *, size_t, size_t *) dontdiscard;
|
||||
char *utf16to8(const char16_t *, size_t, size_t *) dontdiscard;
|
||||
wchar_t *utf8to32(const char *, size_t, size_t *) dontdiscard;
|
||||
wchar_t *utf16to32(const char16_t *, size_t, size_t *) dontdiscard;
|
||||
char *utf32to8(const wchar_t *, size_t, size_t *) dontdiscard;
|
||||
char *xhomedir(void) dontdiscard;
|
||||
char *xstripext(const char *) dontdiscard;
|
||||
char *xstripexts(const char *) dontdiscard;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue