address Victor's review

picnixz · picnixz · commit 303b13c4c61a · 2024-09-25T17:24:50.000+02:00
diff --git a/Lib/test/test_capi/test_codecs.py b/Lib/test/test_capi/test_codecs.py
@@ -592,14 +592,21 @@ def use_custom_encoder(self):
 
     def test_codec_register(self):
         search_function, encoding = self.search_function, self.encoding_name
+        # register the search function using the C API
         self.assertIsNone(_testcapi.codec_register(search_function))
         self.assertIs(self.codecs.lookup(encoding), search_function(encoding))
         self.assertEqual(self.codecs.encode('123', encoding=encoding), '321')
+        # unregister the search function using the regular API
+        self.codecs.unregister(search_function)
+        self.assertRaises(LookupError, self.codecs.lookup, encoding)
 
     def test_codec_unregister(self):
         search_function, encoding = self.search_function, self.encoding_name
         self.assertRaises(LookupError, self.codecs.lookup, encoding)
+        # register the search function using the regular API
         self.codecs.register(search_function)
+        self.assertIsNotNone(self.codecs.lookup(encoding))
+        # unregister the search function using the C API
         self.assertIsNone(_testcapi.codec_unregister(search_function))
         self.assertRaises(LookupError, self.codecs.lookup, encoding)
 
@@ -625,24 +632,23 @@ def test_codec_encode(self):
         encode = _testcapi.codec_encode
         self.assertEqual(encode('a', 'utf-8', NULL), b'a')
         self.assertEqual(encode('a', 'utf-8', 'strict'), b'a')
-        self.assertEqual(encode('é', 'ascii', 'ignore'), b'')
-        # todo: add more cases
+        self.assertEqual(encode('[é]', 'ascii', 'ignore'), b'[]')
+
         self.assertRaises(TypeError, encode, NULL, 'ascii', 'strict')
         # CRASHES encode('a', NULL, 'strict')
 
     def test_codec_decode(self):
         decode = _testcapi.codec_decode
 
-        b = b'a\xc2\xa1\xe4\xbd\xa0\xf0\x9f\x98\x80'
         s = 'a\xa1\u4f60\U0001f600'
+        b = s.encode()
 
         self.assertEqual(decode(b, 'utf-8', 'strict'), s)
         self.assertEqual(decode(b, 'utf-8', NULL), s)
         self.assertEqual(decode(b, 'latin1', 'strict'), b.decode('latin1'))
         self.assertRaises(UnicodeDecodeError, decode, b, 'ascii', 'strict')
         self.assertRaises(UnicodeDecodeError, decode, b, 'ascii', NULL)
         self.assertEqual(decode(b, 'ascii', 'replace'), 'a' + '\ufffd'*9)
-        # todo: add more cases
 
         # _codecs.decode only reports unknown errors policy when they are
         # used (it has a fast path for empty bytes); this is different from
@@ -685,6 +691,7 @@ def test_codec_stream_writer(self):
             writer = _testcapi.codec_stream_writer(encoding, stream, 'strict')
             self.assertIsInstance(writer, self.codec_info.streamwriter)
 
+
 class CAPICodecErrors(unittest.TestCase):
 
     def setUp(self):
diff --git a/Modules/_testcapi/codec.c b/Modules/_testcapi/codec.c
@@ -24,10 +24,9 @@ static PyObject *
 codec_known_encoding(PyObject *Py_UNUSED(module), PyObject *args)
 {
     const char *encoding;   // should not be NULL
-    if (!PyArg_ParseTuple(args, "z", &encoding)) {
+    if (!PyArg_ParseTuple(args, "s", &encoding)) {
         return NULL;
     }
-    assert(encoding != NULL);
     return PyCodec_KnownEncoding(encoding) ? Py_True : Py_False;
 }
 
@@ -39,10 +38,9 @@ codec_encode(PyObject *Py_UNUSED(module), PyObject *args)
     PyObject *input;
     const char *encoding;   // should not be NULL
     const char *errors;     // can be NULL
-    if (!PyArg_ParseTuple(args, "O|zz", &input, &encoding, &errors)) {
+    if (!PyArg_ParseTuple(args, "O|sz", &input, &encoding, &errors)) {
         return NULL;
     }
-    assert(encoding != NULL);
     return PyCodec_Encode(input, encoding, errors);
 }
 
@@ -52,32 +50,29 @@ codec_decode(PyObject *Py_UNUSED(module), PyObject *args)
     PyObject *input;
     const char *encoding;   // should not be NULL
     const char *errors;     // can be NULL
-    if (!PyArg_ParseTuple(args, "O|zz", &input, &encoding, &errors)) {
+    if (!PyArg_ParseTuple(args, "O|sz", &input, &encoding, &errors)) {
         return NULL;
     }
-    assert(encoding != NULL);
     return PyCodec_Decode(input, encoding, errors);
 }
 
 static PyObject *
 codec_encoder(PyObject *Py_UNUSED(module), PyObject *args)
 {
     const char *encoding;  // should not be NULL
-    if (!PyArg_ParseTuple(args, "z", &encoding)) {
+    if (!PyArg_ParseTuple(args, "s", &encoding)) {
         return NULL;
     }
-    assert(encoding != NULL);
     return PyCodec_Encoder(encoding);
 }
 
 static PyObject *
 codec_decoder(PyObject *Py_UNUSED(module), PyObject *args)
 {
     const char *encoding;  // should not be NULL
-    if (!PyArg_ParseTuple(args, "z", &encoding)) {
+    if (!PyArg_ParseTuple(args, "s", &encoding)) {
         return NULL;
     }
-    assert(encoding != NULL);
     return PyCodec_Decoder(encoding);
 }
 
@@ -86,11 +81,9 @@ codec_incremental_encoder(PyObject *Py_UNUSED(module), PyObject *args)
 {
     const char *encoding;   // should not be NULL
     const char *errors;     // should not be NULL
-    if (!PyArg_ParseTuple(args, "zz", &encoding, &errors)) {
+    if (!PyArg_ParseTuple(args, "ss", &encoding, &errors)) {
         return NULL;
     }
-    assert(encoding != NULL);
-    assert(errors != NULL);
     return PyCodec_IncrementalEncoder(encoding, errors);
 }
 
@@ -99,11 +92,9 @@ codec_incremental_decoder(PyObject *Py_UNUSED(module), PyObject *args)
 {
     const char *encoding;   // should not be NULL
     const char *errors;     // should not be NULL
-    if (!PyArg_ParseTuple(args, "zz", &encoding, &errors)) {
+    if (!PyArg_ParseTuple(args, "ss", &encoding, &errors)) {
         return NULL;
     }
-    assert(encoding != NULL);
-    assert(errors != NULL);
     return PyCodec_IncrementalDecoder(encoding, errors);
 }
 
@@ -113,11 +104,9 @@ codec_stream_reader(PyObject *Py_UNUSED(module), PyObject *args)
     const char *encoding;  // should not be NULL
     PyObject *stream;
     const char *errors;    // should not be NULL
-    if (!PyArg_ParseTuple(args, "zOz", &encoding, &stream, &errors)) {
+    if (!PyArg_ParseTuple(args, "sOs", &encoding, &stream, &errors)) {
         return NULL;
     }
-    assert(encoding != NULL);
-    assert(errors != NULL);
     return PyCodec_StreamReader(encoding, stream, errors);
 }
 
@@ -127,11 +116,9 @@ codec_stream_writer(PyObject *Py_UNUSED(module), PyObject *args)
     const char *encoding;  // should not be NULL
     PyObject *stream;
     const char *errors;    // should not be NULL
-    if (!PyArg_ParseTuple(args, "zOz", &encoding, &stream, &errors)) {
+    if (!PyArg_ParseTuple(args, "sOs", &encoding, &stream, &errors)) {
         return NULL;
     }
-    assert(encoding != NULL);
-    assert(errors != NULL);
     return PyCodec_StreamWriter(encoding, stream, errors);
 }
 
@@ -142,10 +129,9 @@ codec_register_error(PyObject *Py_UNUSED(module), PyObject *args)
 {
     const char *encoding;  // should not be NULL
     PyObject *error;
-    if (!PyArg_ParseTuple(args, "zO", &encoding, &error)) {
+    if (!PyArg_ParseTuple(args, "sO", &encoding, &error)) {
         return NULL;
     }
-    assert(encoding != NULL);
     if (PyCodec_RegisterError(encoding, error) < 0) {
         return NULL;
     }

Original file line number	Diff line number	Diff line change
`@@ -24,10 +24,9 @@ static PyObject *`
`24`	`24`	`codec_known_encoding(PyObject *Py_UNUSED(module), PyObject *args)`
`25`	`25`	`{`
`26`	`26`	`const char *encoding; // should not be NULL`
`27`		`- if (!PyArg_ParseTuple(args, "z", &encoding)) {`
	`27`	`+ if (!PyArg_ParseTuple(args, "s", &encoding)) {`
`28`	`28`	`return NULL;`
`29`	`29`	`}`
`30`		`- assert(encoding != NULL);`
`31`	`30`	`return PyCodec_KnownEncoding(encoding) ? Py_True : Py_False;`
`32`	`31`	`}`
`33`	`32`
`@@ -39,10 +38,9 @@ codec_encode(PyObject *Py_UNUSED(module), PyObject *args)`
`39`	`38`	`PyObject *input;`
`40`	`39`	`const char *encoding; // should not be NULL`
`41`	`40`	`const char *errors; // can be NULL`
`42`		`- if (!PyArg_ParseTuple(args, "O\|zz", &input, &encoding, &errors)) {`
	`41`	`+ if (!PyArg_ParseTuple(args, "O\|sz", &input, &encoding, &errors)) {`
`43`	`42`	`return NULL;`
`44`	`43`	`}`
`45`		`- assert(encoding != NULL);`
`46`	`44`	`return PyCodec_Encode(input, encoding, errors);`
`47`	`45`	`}`
`48`	`46`
`@@ -52,32 +50,29 @@ codec_decode(PyObject *Py_UNUSED(module), PyObject *args)`
`52`	`50`	`PyObject *input;`
`53`	`51`	`const char *encoding; // should not be NULL`
`54`	`52`	`const char *errors; // can be NULL`
`55`		`- if (!PyArg_ParseTuple(args, "O\|zz", &input, &encoding, &errors)) {`
	`53`	`+ if (!PyArg_ParseTuple(args, "O\|sz", &input, &encoding, &errors)) {`
`56`	`54`	`return NULL;`
`57`	`55`	`}`
`58`		`- assert(encoding != NULL);`
`59`	`56`	`return PyCodec_Decode(input, encoding, errors);`
`60`	`57`	`}`
`61`	`58`
`62`	`59`	`static PyObject *`
`63`	`60`	`codec_encoder(PyObject *Py_UNUSED(module), PyObject *args)`
`64`	`61`	`{`
`65`	`62`	`const char *encoding; // should not be NULL`
`66`		`- if (!PyArg_ParseTuple(args, "z", &encoding)) {`
	`63`	`+ if (!PyArg_ParseTuple(args, "s", &encoding)) {`
`67`	`64`	`return NULL;`
`68`	`65`	`}`
`69`		`- assert(encoding != NULL);`
`70`	`66`	`return PyCodec_Encoder(encoding);`
`71`	`67`	`}`
`72`	`68`
`73`	`69`	`static PyObject *`
`74`	`70`	`codec_decoder(PyObject *Py_UNUSED(module), PyObject *args)`
`75`	`71`	`{`
`76`	`72`	`const char *encoding; // should not be NULL`
`77`		`- if (!PyArg_ParseTuple(args, "z", &encoding)) {`
	`73`	`+ if (!PyArg_ParseTuple(args, "s", &encoding)) {`
`78`	`74`	`return NULL;`
`79`	`75`	`}`
`80`		`- assert(encoding != NULL);`
`81`	`76`	`return PyCodec_Decoder(encoding);`
`82`	`77`	`}`
`83`	`78`
`@@ -86,11 +81,9 @@ codec_incremental_encoder(PyObject *Py_UNUSED(module), PyObject *args)`
`86`	`81`	`{`
`87`	`82`	`const char *encoding; // should not be NULL`
`88`	`83`	`const char *errors; // should not be NULL`
`89`		`- if (!PyArg_ParseTuple(args, "zz", &encoding, &errors)) {`
	`84`	`+ if (!PyArg_ParseTuple(args, "ss", &encoding, &errors)) {`
`90`	`85`	`return NULL;`
`91`	`86`	`}`
`92`		`- assert(encoding != NULL);`
`93`		`- assert(errors != NULL);`
`94`	`87`	`return PyCodec_IncrementalEncoder(encoding, errors);`
`95`	`88`	`}`
`96`	`89`
`@@ -99,11 +92,9 @@ codec_incremental_decoder(PyObject *Py_UNUSED(module), PyObject *args)`
`99`	`92`	`{`
`100`	`93`	`const char *encoding; // should not be NULL`
`101`	`94`	`const char *errors; // should not be NULL`
`102`		`- if (!PyArg_ParseTuple(args, "zz", &encoding, &errors)) {`
	`95`	`+ if (!PyArg_ParseTuple(args, "ss", &encoding, &errors)) {`
`103`	`96`	`return NULL;`
`104`	`97`	`}`
`105`		`- assert(encoding != NULL);`
`106`		`- assert(errors != NULL);`
`107`	`98`	`return PyCodec_IncrementalDecoder(encoding, errors);`
`108`	`99`	`}`
`109`	`100`
`@@ -113,11 +104,9 @@ codec_stream_reader(PyObject *Py_UNUSED(module), PyObject *args)`
`113`	`104`	`const char *encoding; // should not be NULL`
`114`	`105`	`PyObject *stream;`
`115`	`106`	`const char *errors; // should not be NULL`
`116`		`- if (!PyArg_ParseTuple(args, "zOz", &encoding, &stream, &errors)) {`
	`107`	`+ if (!PyArg_ParseTuple(args, "sOs", &encoding, &stream, &errors)) {`
`117`	`108`	`return NULL;`
`118`	`109`	`}`
`119`		`- assert(encoding != NULL);`
`120`		`- assert(errors != NULL);`
`121`	`110`	`return PyCodec_StreamReader(encoding, stream, errors);`
`122`	`111`	`}`
`123`	`112`
`@@ -127,11 +116,9 @@ codec_stream_writer(PyObject *Py_UNUSED(module), PyObject *args)`
`127`	`116`	`const char *encoding; // should not be NULL`
`128`	`117`	`PyObject *stream;`
`129`	`118`	`const char *errors; // should not be NULL`
`130`		`- if (!PyArg_ParseTuple(args, "zOz", &encoding, &stream, &errors)) {`
	`119`	`+ if (!PyArg_ParseTuple(args, "sOs", &encoding, &stream, &errors)) {`
`131`	`120`	`return NULL;`
`132`	`121`	`}`
`133`		`- assert(encoding != NULL);`
`134`		`- assert(errors != NULL);`
`135`	`122`	`return PyCodec_StreamWriter(encoding, stream, errors);`
`136`	`123`	`}`
`137`	`124`
`@@ -142,10 +129,9 @@ codec_register_error(PyObject *Py_UNUSED(module), PyObject *args)`
`142`	`129`	`{`
`143`	`130`	`const char *encoding; // should not be NULL`
`144`	`131`	`PyObject *error;`
`145`		`- if (!PyArg_ParseTuple(args, "zO", &encoding, &error)) {`
	`132`	`+ if (!PyArg_ParseTuple(args, "sO", &encoding, &error)) {`
`146`	`133`	`return NULL;`
`147`	`134`	`}`
`148`		`- assert(encoding != NULL);`
`149`	`135`	`if (PyCodec_RegisterError(encoding, error) < 0) {`
`150`	`136`	`return NULL;`
`151`	`137`	`}`