Improve Libc by making Python work even better

Actually Portable Python is now outperforming the Python binaries that come bundled with Linux distros, at things like HTTP serving. You can now have a fully featured Python install in just one .com file that runs on six operating systems and is about 10mb in size. With tuning, the tiniest is ~1mb. We've got most of the libraries working, including pysqlite, and the repl now feels very pleasant. The things you can't do quite yet are: threads and shared objects but that can happen in the future, if the community falls in love with this project and wants to see it developed further. Changes: - Add siginterrupt() - Add sqlite3 to Python - Add issymlink() helper - Make GetZipCdir() faster - Add tgamma() and finite() - Add legacy function lutimes() - Add readlink() and realpath() - Use heap allocations when appropriate - Reorganize Python into two-stage build - Save Lua / Python shell history to dotfile - Integrate Python Lib embedding into linkage - Make isregularfile() and isdirectory() go faster - Make Python shell auto-completion work perfectly - Make crash reports work better if changed directory - Fix Python+NT open() / access() flag overflow error - Disable Python tests relating to \N{LONG NAME} syntax - Have Python REPL copyright() show all notice embeddings The biggest technical challenge at the moment is working around when Python tries to be too clever about filenames.
2025-10-20 08:30:00 +00:00 · 2021-08-18 14:21:30 -07:00 · 2021-08-18 14:21:30 -07:00 · 8af197560e
commit 8af197560e
parent 98ccbf44b1
179 changed files with 6728 additions and 10430 deletions
--- a/third_party/python/Lib/test/test_codeccallbacks.py
+++ b/third_party/python/Lib/test/test_codeccallbacks.py
@ -149,21 +149,20 @@ class CodecCallbackTest(unittest.TestCase):
        sout = b"a\xac\\u1234\xa4\\u8000\\U0010ffff"
        self.assertEqual(sin.encode("iso-8859-15", "backslashreplace"), sout)

-    def test_nameescape(self):
-        # Does the same as backslashescape, but prefers ``\N{...}`` escape
-        # sequences.
-        sin = "a\xac\u1234\u20ac\u8000\U0010ffff"
-        sout = (b'a\\N{NOT SIGN}\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
-                b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
-        self.assertEqual(sin.encode("ascii", "namereplace"), sout)
-
-        sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
-                b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
-        self.assertEqual(sin.encode("latin-1", "namereplace"), sout)
-
-        sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\xa4'
-                b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
-        self.assertEqual(sin.encode("iso-8859-15", "namereplace"), sout)
+    # # TODO(jart): pycomp.com needs \N thing
+    # def test_nameescape(self):
+    #     # Does the same as backslashescape, but prefers ``\N{...}`` escape
+    #     # sequences.
+    #     sin = "a\xac\u1234\u20ac\u8000\U0010ffff"
+    #     sout = (b'a\\N{NOT SIGN}\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
+    #             b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
+    #     self.assertEqual(sin.encode("ascii", "namereplace"), sout)
+    #     sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}'
+    #             b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
+    #     self.assertEqual(sin.encode("latin-1", "namereplace"), sout)
+    #     sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\xa4'
+    #             b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff')
+    #     self.assertEqual(sin.encode("iso-8859-15", "namereplace"), sout)

    def test_decoding_callbacks(self):
        # This is a test for a decoding callback handler
@ -615,51 +614,52 @@ class CodecCallbackTest(unittest.TestCase):
                    (r, 2)
                )

-    def test_badandgoodnamereplaceexceptions(self):
-        # "namereplace" complains about a non-exception passed in
-        self.assertRaises(
-           TypeError,
-           codecs.namereplace_errors,
-           42
-        )
-        # "namereplace" complains about the wrong exception types
-        self.assertRaises(
-           TypeError,
-           codecs.namereplace_errors,
-           UnicodeError("ouch")
-        )
-        # "namereplace" can only be used for encoding
-        self.assertRaises(
-            TypeError,
-            codecs.namereplace_errors,
-            UnicodeDecodeError("ascii", bytearray(b"\xff"), 0, 1, "ouch")
-        )
-        self.assertRaises(
-            TypeError,
-            codecs.namereplace_errors,
-            UnicodeTranslateError("\u3042", 0, 1, "ouch")
-        )
-        # Use the correct exception
-        tests = [
-            ("\u3042", "\\N{HIRAGANA LETTER A}"),
-            ("\x00", "\\x00"),
-            ("\ufbf9", "\\N{ARABIC LIGATURE UIGHUR KIRGHIZ YEH WITH "
-                       "HAMZA ABOVE WITH ALEF MAKSURA ISOLATED FORM}"),
-            ("\U000e007f", "\\N{CANCEL TAG}"),
-            ("\U0010ffff", "\\U0010ffff"),
-            # Lone surrogates
-            ("\ud800", "\\ud800"),
-            ("\udfff", "\\udfff"),
-            ("\ud800\udfff", "\\ud800\\udfff"),
-        ]
-        for s, r in tests:
-            with self.subTest(str=s):
-                self.assertEqual(
-                    codecs.namereplace_errors(
-                        UnicodeEncodeError("ascii", "a" + s + "b",
-                                           1, 1 + len(s), "ouch")),
-                    (r, 1 + len(s))
-                )
+    # # TODO(jart): pycomp.com needs \N thing
+    # def test_badandgoodnamereplaceexceptions(self):
+    #     # "namereplace" complains about a non-exception passed in
+    #     self.assertRaises(
+    #        TypeError,
+    #        codecs.namereplace_errors,
+    #        42
+    #     )
+    #     # "namereplace" complains about the wrong exception types
+    #     self.assertRaises(
+    #        TypeError,
+    #        codecs.namereplace_errors,
+    #        UnicodeError("ouch")
+    #     )
+    #     # "namereplace" can only be used for encoding
+    #     self.assertRaises(
+    #         TypeError,
+    #         codecs.namereplace_errors,
+    #         UnicodeDecodeError("ascii", bytearray(b"\xff"), 0, 1, "ouch")
+    #     )
+    #     self.assertRaises(
+    #         TypeError,
+    #         codecs.namereplace_errors,
+    #         UnicodeTranslateError("\u3042", 0, 1, "ouch")
+    #     )
+    #     # Use the correct exception
+    #     tests = [
+    #         ("\u3042", "\\N{HIRAGANA LETTER A}"),
+    #         ("\x00", "\\x00"),
+    #         ("\ufbf9", "\\N{ARABIC LIGATURE UIGHUR KIRGHIZ YEH WITH "
+    #                    "HAMZA ABOVE WITH ALEF MAKSURA ISOLATED FORM}"),
+    #         ("\U000e007f", "\\N{CANCEL TAG}"),
+    #         ("\U0010ffff", "\\U0010ffff"),
+    #         # Lone surrogates
+    #         ("\ud800", "\\ud800"),
+    #         ("\udfff", "\\udfff"),
+    #         ("\ud800\udfff", "\\ud800\\udfff"),
+    #     ]
+    #     for s, r in tests:
+    #         with self.subTest(str=s):
+    #             self.assertEqual(
+    #                 codecs.namereplace_errors(
+    #                     UnicodeEncodeError("ascii", "a" + s + "b",
+    #                                        1, 1 + len(s), "ouch")),
+    #                 (r, 1 + len(s))
+    #             )

    def test_badandgoodsurrogateescapeexceptions(self):
        surrogateescape_errors = codecs.lookup_error('surrogateescape')