Files
typthon/Python/pystrhex.c
copilot-swe-agent[bot] b198f511d2 Rename Py_ to Ty_ throughout C API
Massive automated renaming of all Py_/PyObject/etc. prefixes to Ty_/TyObject/etc.
This includes:
- All public API types (TyObject, TyTypeObject, etc.)
- All public API functions (Ty_Initialize, Ty_BuildValue, etc.)
- All internal API (_Ty_ prefixes)
- Reference counting macros (Ty_INCREF, Ty_DECREF, etc.)
- Type flags (Ty_TPFLAGS_*)
- Debug flags (Ty_DEBUG, Ty_TRACE_REFS, etc.)
- All object type APIs (TyList_, TyDict_, TyUnicode_, etc.)

This changes over 60,000 occurrences across 1000+ files.

Co-authored-by: johndoe6345789 <224850594+johndoe6345789@users.noreply.github.com>
2025-12-29 17:37:49 +00:00

173 lines
5.3 KiB
C

/* Format bytes as hexadecimal */
#include "Python.h"
#include "pycore_strhex.h" // _Ty_strhex_with_sep()
#include "pycore_unicodeobject.h" // _TyUnicode_CheckConsistency()
static TyObject *_Ty_strhex_impl(const char* argbuf, const Ty_ssize_t arglen,
TyObject* sep, int bytes_per_sep_group,
const int return_bytes)
{
assert(arglen >= 0);
Ty_UCS1 sep_char = 0;
if (sep) {
Ty_ssize_t seplen = PyObject_Length((TyObject*)sep);
if (seplen < 0) {
return NULL;
}
if (seplen != 1) {
TyErr_SetString(TyExc_ValueError, "sep must be length 1.");
return NULL;
}
if (TyUnicode_Check(sep)) {
if (TyUnicode_KIND(sep) != TyUnicode_1BYTE_KIND) {
TyErr_SetString(TyExc_ValueError, "sep must be ASCII.");
return NULL;
}
sep_char = TyUnicode_READ_CHAR(sep, 0);
}
else if (TyBytes_Check(sep)) {
sep_char = TyBytes_AS_STRING(sep)[0];
}
else {
TyErr_SetString(TyExc_TypeError, "sep must be str or bytes.");
return NULL;
}
if (sep_char > 127 && !return_bytes) {
TyErr_SetString(TyExc_ValueError, "sep must be ASCII.");
return NULL;
}
}
else {
bytes_per_sep_group = 0;
}
unsigned int abs_bytes_per_sep = Ty_ABS(bytes_per_sep_group);
Ty_ssize_t resultlen = 0;
if (bytes_per_sep_group && arglen > 0) {
/* How many sep characters we'll be inserting. */
resultlen = (arglen - 1) / abs_bytes_per_sep;
}
/* Bounds checking for our Ty_ssize_t indices. */
if (arglen >= PY_SSIZE_T_MAX / 2 - resultlen) {
return TyErr_NoMemory();
}
resultlen += arglen * 2;
if ((size_t)abs_bytes_per_sep >= (size_t)arglen) {
bytes_per_sep_group = 0;
abs_bytes_per_sep = 0;
}
TyObject *retval;
Ty_UCS1 *retbuf;
if (return_bytes) {
/* If _TyBytes_FromSize() were public we could avoid malloc+copy. */
retval = TyBytes_FromStringAndSize(NULL, resultlen);
if (!retval) {
return NULL;
}
retbuf = (Ty_UCS1 *)TyBytes_AS_STRING(retval);
}
else {
retval = TyUnicode_New(resultlen, 127);
if (!retval) {
return NULL;
}
retbuf = TyUnicode_1BYTE_DATA(retval);
}
/* Hexlify */
Ty_ssize_t i, j;
unsigned char c;
if (bytes_per_sep_group == 0) {
for (i = j = 0; i < arglen; ++i) {
assert((j + 1) < resultlen);
c = argbuf[i];
retbuf[j++] = Ty_hexdigits[c >> 4];
retbuf[j++] = Ty_hexdigits[c & 0x0f];
}
assert(j == resultlen);
}
else {
/* The number of complete chunk+sep periods */
Ty_ssize_t chunks = (arglen - 1) / abs_bytes_per_sep;
Ty_ssize_t chunk;
unsigned int k;
if (bytes_per_sep_group < 0) {
i = j = 0;
for (chunk = 0; chunk < chunks; chunk++) {
for (k = 0; k < abs_bytes_per_sep; k++) {
c = argbuf[i++];
retbuf[j++] = Ty_hexdigits[c >> 4];
retbuf[j++] = Ty_hexdigits[c & 0x0f];
}
retbuf[j++] = sep_char;
}
while (i < arglen) {
c = argbuf[i++];
retbuf[j++] = Ty_hexdigits[c >> 4];
retbuf[j++] = Ty_hexdigits[c & 0x0f];
}
assert(j == resultlen);
}
else {
i = arglen - 1;
j = resultlen - 1;
for (chunk = 0; chunk < chunks; chunk++) {
for (k = 0; k < abs_bytes_per_sep; k++) {
c = argbuf[i--];
retbuf[j--] = Ty_hexdigits[c & 0x0f];
retbuf[j--] = Ty_hexdigits[c >> 4];
}
retbuf[j--] = sep_char;
}
while (i >= 0) {
c = argbuf[i--];
retbuf[j--] = Ty_hexdigits[c & 0x0f];
retbuf[j--] = Ty_hexdigits[c >> 4];
}
assert(j == -1);
}
}
#ifdef Ty_DEBUG
if (!return_bytes) {
assert(_TyUnicode_CheckConsistency(retval, 1));
}
#endif
return retval;
}
TyObject * _Ty_strhex(const char* argbuf, const Ty_ssize_t arglen)
{
return _Ty_strhex_impl(argbuf, arglen, NULL, 0, 0);
}
/* Same as above but returns a bytes() instead of str() to avoid the
* need to decode the str() when bytes are needed. */
TyObject* _Ty_strhex_bytes(const char* argbuf, const Ty_ssize_t arglen)
{
return _Ty_strhex_impl(argbuf, arglen, NULL, 0, 1);
}
/* These variants include support for a separator between every N bytes: */
TyObject* _Ty_strhex_with_sep(const char* argbuf, const Ty_ssize_t arglen,
TyObject* sep, const int bytes_per_group)
{
return _Ty_strhex_impl(argbuf, arglen, sep, bytes_per_group, 0);
}
/* Same as above but returns a bytes() instead of str() to avoid the
* need to decode the str() when bytes are needed. */
TyObject* _Ty_strhex_bytes_with_sep(const char* argbuf, const Ty_ssize_t arglen,
TyObject* sep, const int bytes_per_group)
{
return _Ty_strhex_impl(argbuf, arglen, sep, bytes_per_group, 1);
}