Make numerous improvements

- Python static hello world now 1.8mb
- Python static fully loaded now 10mb
- Python HTTPS client now uses MbedTLS
- Python REPL now completes import stmts
- Increase stack size for Python for now
- Begin synthesizing posixpath and ntpath
- Restore Python \N{UNICODE NAME} support
- Restore Python NFKD symbol normalization
- Add optimized code path for Intel SHA-NI
- Get more Python unit tests passing faster
- Get Python help() pagination working on NT
- Python hashlib now supports MbedTLS PBKDF2
- Make memcpy/memmove/memcmp/bcmp/etc. faster
- Add Mersenne Twister and Vigna to LIBC_RAND
- Provide privileged __printf() for error code
- Fix zipos opendir() so that it reports ENOTDIR
- Add basic chmod() implementation for Windows NT
- Add Cosmo's best functions to Python cosmo module
- Pin function trace indent depth to that of caller
- Show memory diagram on invalid access in MODE=dbg
- Differentiate stack overflow on crash in MODE=dbg
- Add stb_truetype and tools for analyzing font files
- Upgrade to UNICODE 13 and reduce its binary footprint
- COMPILE.COM now logs resource usage of build commands
- Start implementing basic poll() support on bare metal
- Set getauxval(AT_EXECFN) to GetModuleFileName() on NT
- Add descriptions to strerror() in non-TINY build modes
- Add COUNTBRANCH() macro to help with micro-optimizations
- Make error / backtrace / asan / memory code more unbreakable
- Add fast perfect C implementation of μ-Law and a-Law audio codecs
- Make strtol() functions consistent with other libc implementations
- Improve Linenoise implementation (see also github.com/jart/bestline)
- COMPILE.COM now suppresses stdout/stderr of successful build commands
This commit is contained in:
Justine Tunney 2021-09-27 22:58:51 -07:00
parent fa7b4f5bd1
commit 39bf41f4eb
806 changed files with 77494 additions and 63859 deletions

View file

@ -150,20 +150,19 @@ class CodecCallbackTest(unittest.TestCase):
sout = b"a\xac\\u1234\xa4\\u8000\\U0010ffff"
self.assertEqual(sin.encode("iso-8859-15", "backslashreplace"), sout)
# # TODO(jart): pycomp.com needs \N thing
# def test_nameescape(self):
# # Does the same as backslashescape, but prefers ``\N{...}`` escape
# # sequences.
# sin = "a\xac\u1234\u20ac\u8000\U0010ffff"
# sout = (b'a\\N{NOT SIGN}\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
# b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
# self.assertEqual(sin.encode("ascii", "namereplace"), sout)
# sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
# b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
# self.assertEqual(sin.encode("latin-1", "namereplace"), sout)
# sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\xa4'
# b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
# self.assertEqual(sin.encode("iso-8859-15", "namereplace"), sout)
def test_nameescape(self):
# Does the same as backslashescape, but prefers ``\N{...}`` escape
# sequences.
sin = "a\xac\u1234\u20ac\u8000\U0010ffff"
sout = (b'a\\N{NOT SIGN}\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
self.assertEqual(sin.encode("ascii", "namereplace"), sout)
sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
self.assertEqual(sin.encode("latin-1", "namereplace"), sout)
sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\xa4'
b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
self.assertEqual(sin.encode("iso-8859-15", "namereplace"), sout)
def test_decoding_callbacks(self):
# This is a test for a decoding callback handler
@ -615,52 +614,51 @@ class CodecCallbackTest(unittest.TestCase):
(r, 2)
)
# # TODO(jart): pycomp.com needs \N thing
# def test_badandgoodnamereplaceexceptions(self):
# # "namereplace" complains about a non-exception passed in
# self.assertRaises(
# TypeError,
# codecs.namereplace_errors,
# 42
# )
# # "namereplace" complains about the wrong exception types
# self.assertRaises(
# TypeError,
# codecs.namereplace_errors,
# UnicodeError("ouch")
# )
# # "namereplace" can only be used for encoding
# self.assertRaises(
# TypeError,
# codecs.namereplace_errors,
# UnicodeDecodeError("ascii", bytearray(b"\xff"), 0, 1, "ouch")
# )
# self.assertRaises(
# TypeError,
# codecs.namereplace_errors,
# UnicodeTranslateError("\u3042", 0, 1, "ouch")
# )
# # Use the correct exception
# tests = [
# ("\u3042", "\\N{HIRAGANA LETTER A}"),
# ("\x00", "\\x00"),
# ("\ufbf9", "\\N{ARABIC LIGATURE UIGHUR KIRGHIZ YEH WITH "
# "HAMZA ABOVE WITH ALEF MAKSURA ISOLATED FORM}"),
# ("\U000e007f", "\\N{CANCEL TAG}"),
# ("\U0010ffff", "\\U0010ffff"),
# # Lone surrogates
# ("\ud800", "\\ud800"),
# ("\udfff", "\\udfff"),
# ("\ud800\udfff", "\\ud800\\udfff"),
# ]
# for s, r in tests:
# with self.subTest(str=s):
# self.assertEqual(
# codecs.namereplace_errors(
# UnicodeEncodeError("ascii", "a" + s + "b",
# 1, 1 + len(s), "ouch")),
# (r, 1 + len(s))
# )
def test_badandgoodnamereplaceexceptions(self):
# "namereplace" complains about a non-exception passed in
self.assertRaises(
TypeError,
codecs.namereplace_errors,
42
)
# "namereplace" complains about the wrong exception types
self.assertRaises(
TypeError,
codecs.namereplace_errors,
UnicodeError("ouch")
)
# "namereplace" can only be used for encoding
self.assertRaises(
TypeError,
codecs.namereplace_errors,
UnicodeDecodeError("ascii", bytearray(b"\xff"), 0, 1, "ouch")
)
self.assertRaises(
TypeError,
codecs.namereplace_errors,
UnicodeTranslateError("\u3042", 0, 1, "ouch")
)
# Use the correct exception
tests = [
("\u3042", "\\N{HIRAGANA LETTER A}"),
("\x00", "\\x00"),
("\ufbf9", "\\N{ARABIC LIGATURE UIGHUR KIRGHIZ YEH WITH "
"HAMZA ABOVE WITH ALEF MAKSURA ISOLATED FORM}"),
("\U000e007f", "\\N{CANCEL TAG}"),
("\U0010ffff", "\\U0010ffff"),
# Lone surrogates
("\ud800", "\\ud800"),
("\udfff", "\\udfff"),
("\ud800\udfff", "\\ud800\\udfff"),
]
for s, r in tests:
with self.subTest(str=s):
self.assertEqual(
codecs.namereplace_errors(
UnicodeEncodeError("ascii", "a" + s + "b",
1, 1 + len(s), "ouch")),
(r, 1 + len(s))
)
def test_badandgoodsurrogateescapeexceptions(self):
surrogateescape_errors = codecs.lookup_error('surrogateescape')