mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-02-28 22:18:29 +00:00
We can now link even smaller Python binaries. For example, the hello.com program in the Python build directory is a compiled, linked executable of hello.py, which just prints hello world. Using decentralized sections, we can make that binary 1.9 MB in size (noting that python.com is 6.3 MB!). This works for nontrivial programs too. For example, say we want an APE binary that's equivalent to python.com -m http.server. Our makefile now builds such a binary using the new launcher, and it's only 3.2 MB in size, since Python sources get turned into ELF objects, which tell our linker that we need things like native hashing algorithm code.
156 lines
2.8 KiB
C
156 lines
2.8 KiB
C
/* clang-format off */
|
|
/*
|
|
* _codecs_tw.c: Codecs collection for Taiwan's encodings
|
|
*
|
|
* Written by Hye-Shik "Bourne to Macro" Chang <perky@FreeBSD.org>
|
|
*/
|
|
|
|
#include "third_party/python/Modules/cjkcodecs/cjkcodecs.h"
|
|
#include "third_party/python/Include/yoink.h"
|
|
#include "third_party/python/Include/import.h"
|
|
#include "third_party/python/Modules/cjkcodecs/mappings_tw.inc"
|
|
|
|
/*
 * Names this translation unit announces via PYTHON_PROVIDE: the module
 * itself, its two mapping tables (big5, cp950ext) and getcodec.
 * NOTE(review): PYTHON_PROVIDE comes from yoink.h, which is not visible
 * here; presumably it emits linker-visible symbols so that other objects
 * can pull this module in by name -- confirm against yoink.h.
 */
PYTHON_PROVIDE("_codecs_tw");
|
|
PYTHON_PROVIDE("_codecs_tw.__map_big5");
|
|
PYTHON_PROVIDE("_codecs_tw.__map_cp950ext");
|
|
PYTHON_PROVIDE("_codecs_tw.getcodec");
|
|
|
|
/*
|
|
* BIG5 codec
|
|
*/
|
|
|
|
ENCODER(big5)
|
|
{
|
|
while (*inpos < inlen) {
|
|
Py_UCS4 c = INCHAR1;
|
|
DBCHAR code;
|
|
|
|
if (c < 0x80) {
|
|
REQUIRE_OUTBUF(1);
|
|
**outbuf = (unsigned char)c;
|
|
NEXT(1, 1);
|
|
continue;
|
|
}
|
|
|
|
if (c > 0xFFFF)
|
|
return 1;
|
|
|
|
REQUIRE_OUTBUF(2);
|
|
|
|
if (TRYMAP_ENC(big5, code, c))
|
|
;
|
|
else
|
|
return 1;
|
|
|
|
OUTBYTE1(code >> 8);
|
|
OUTBYTE2(code & 0xFF);
|
|
NEXT(1, 2);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
DECODER(big5)
|
|
{
|
|
while (inleft > 0) {
|
|
unsigned char c = INBYTE1;
|
|
Py_UCS4 decoded;
|
|
|
|
if (c < 0x80) {
|
|
OUTCHAR(c);
|
|
NEXT_IN(1);
|
|
continue;
|
|
}
|
|
|
|
REQUIRE_INBUF(2);
|
|
if (TRYMAP_DEC(big5, decoded, c, INBYTE2)) {
|
|
OUTCHAR(decoded);
|
|
NEXT_IN(2);
|
|
}
|
|
else return 1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
/*
|
|
* CP950 codec
|
|
*/
|
|
|
|
ENCODER(cp950)
|
|
{
|
|
while (*inpos < inlen) {
|
|
Py_UCS4 c = INCHAR1;
|
|
DBCHAR code;
|
|
|
|
if (c < 0x80) {
|
|
WRITEBYTE1((unsigned char)c);
|
|
NEXT(1, 1);
|
|
continue;
|
|
}
|
|
|
|
if (c > 0xFFFF)
|
|
return 1;
|
|
|
|
REQUIRE_OUTBUF(2);
|
|
if (TRYMAP_ENC(cp950ext, code, c))
|
|
;
|
|
else if (TRYMAP_ENC(big5, code, c))
|
|
;
|
|
else
|
|
return 1;
|
|
|
|
OUTBYTE1(code >> 8);
|
|
OUTBYTE2(code & 0xFF);
|
|
NEXT(1, 2);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
DECODER(cp950)
|
|
{
|
|
while (inleft > 0) {
|
|
unsigned char c = INBYTE1;
|
|
Py_UCS4 decoded;
|
|
|
|
if (c < 0x80) {
|
|
OUTCHAR(c);
|
|
NEXT_IN(1);
|
|
continue;
|
|
}
|
|
|
|
REQUIRE_INBUF(2);
|
|
|
|
if (TRYMAP_DEC(cp950ext, decoded, c, INBYTE2))
|
|
OUTCHAR(decoded);
|
|
else if (TRYMAP_DEC(big5, decoded, c, INBYTE2))
|
|
OUTCHAR(decoded);
|
|
else
|
|
return 1;
|
|
|
|
NEXT_IN(2);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
|
|
/*
 * Mapping tables published by this module: big5 and cp950ext, the same
 * two tables the codecs in this file look up with TRYMAP_ENC/TRYMAP_DEC.
 * NOTE(review): MAPPING_ENCDEC presumably registers both the encode and
 * the decode direction of a table -- confirm in cjkcodecs.h.
 */
BEGIN_MAPPINGS_LIST
|
|
MAPPING_ENCDEC(big5)
|
|
MAPPING_ENCDEC(cp950ext)
|
|
END_MAPPINGS_LIST
|
|
|
|
/*
 * Codecs published by this module: big5 and cp950, both listed with
 * CODEC_STATELESS.  Each name corresponds to an ENCODER()/DECODER() pair
 * defined earlier in this file.
 * NOTE(review): how CODEC_STATELESS wires those functions into the table
 * is defined in cjkcodecs.h -- confirm there.
 */
BEGIN_CODECS_LIST
|
|
CODEC_STATELESS(big5)
|
|
CODEC_STATELESS(cp950)
|
|
END_CODECS_LIST
|
|
|
|
/*
 * Module boilerplate for the "tw" codec collection.
 * NOTE(review): presumably this macro (from cjkcodecs.h) defines the
 * module object and PyInit__codecs_tw, which the inittab entry later in
 * this file refers to -- confirm in cjkcodecs.h.
 */
I_AM_A_MODULE_FOR(tw)
|
|
|
|
/*
 * Import-table record pairing the module name "_codecs_tw" with its
 * init function PyInit__codecs_tw.  The object is constant and is placed
 * in the ".rodata.pytab.1" section via _Section.
 * NOTE(review): presumably the link step collects the .rodata.pytab.*
 * records into the table of built-in modules -- confirm against the
 * project's pytab/linker setup.
 */
_Section(".rodata.pytab.1") const struct _inittab _PyImport_Inittab__codecs_tw = {
|
|
"_codecs_tw",
|
|
PyInit__codecs_tw,
|
|
};
|