Files
typthon/Modules/md5module.c
copilot-swe-agent[bot] 42e2356c88 Fix incorrect replacements in Py_ to Ty_ renaming
Fixed several macros and constants that should not have been renamed:
- _Py_CAST, _Py_NULL, _Py_RVALUE (internal utility macros)
- Py_UNUSED (unused parameter macro)
- Py_EQ, Py_NE, Py_LT, Py_LE, Py_GT, Py_GE (comparison constants)
- Py_RETURN_* macros (NONE, TRUE, FALSE, NOTIMPLEMENTED, RICHCOMPARE)
- Py_READONLY, Py_ULL, Py_CONTEXT_SWITCHED
- TyGC_Head in generated clinic files

Build is still in progress with some remaining issues to resolve.

Co-authored-by: johndoe6345789 <224850594+johndoe6345789@users.noreply.github.com>
2025-12-29 17:44:05 +00:00

411 lines
9.6 KiB
C

/* MD5 module */
/* This module provides an interface to the MD5 algorithm */
/* See below for information about the original code this module was
based upon. Additional work performed by:
Andrew Kuchling (amk@amk.ca)
Greg Stein (gstein@lyra.org)
Trevor Perrin (trevp@trevp.net)
Copyright (C) 2005-2007 Gregory P. Smith (greg@krypto.org)
Licensed to PSF under a Contributor Agreement.
*/
/* MD5 objects */
#ifndef Ty_BUILD_CORE_BUILTIN
# define Ty_BUILD_CORE_MODULE 1
#endif
#include "Python.h"
#include "hashlib.h"
/*[clinic input]
module _md5
class MD5Type "MD5object *" "&TyType_Type"
[clinic start generated code]*/
/*[clinic end generated code: output=da39a3ee5e6b4b0d input=6e5261719957a912]*/
/* The MD5 block size and message digest sizes, in bytes */
#define MD5_BLOCKSIZE 64
#define MD5_DIGESTSIZE 16
#include "_hacl/Hacl_Hash_MD5.h"
typedef struct {
PyObject_HEAD
// Prevents undefined behavior via multiple threads entering the C API.
bool use_mutex;
PyMutex mutex;
Hacl_Hash_MD5_state_t *hash_state;
} MD5object;
#define _MD5object_CAST(op) ((MD5object *)(op))
#include "clinic/md5module.c.h"
typedef struct {
TyTypeObject* md5_type;
} MD5State;
static inline MD5State*
md5_get_state(TyObject *module)
{
void *state = TyModule_GetState(module);
assert(state != NULL);
return (MD5State *)state;
}
static MD5object *
newMD5object(MD5State * st)
{
MD5object *md5 = PyObject_GC_New(MD5object, st->md5_type);
if (!md5) {
return NULL;
}
HASHLIB_INIT_MUTEX(md5);
PyObject_GC_Track(md5);
return md5;
}
/* Internal methods for a hash object */
static int
MD5_traverse(TyObject *ptr, visitproc visit, void *arg)
{
Ty_VISIT(Ty_TYPE(ptr));
return 0;
}
static void
MD5_dealloc(TyObject *op)
{
MD5object *ptr = _MD5object_CAST(op);
Hacl_Hash_MD5_free(ptr->hash_state);
TyTypeObject *tp = Ty_TYPE(op);
PyObject_GC_UnTrack(ptr);
PyObject_GC_Del(ptr);
Ty_DECREF(tp);
}
/* External methods for a hash object */
/*[clinic input]
MD5Type.copy
cls: defining_class
Return a copy of the hash object.
[clinic start generated code]*/
static TyObject *
MD5Type_copy_impl(MD5object *self, TyTypeObject *cls)
/*[clinic end generated code: output=bf055e08244bf5ee input=d89087dcfb2a8620]*/
{
MD5State *st = TyType_GetModuleState(cls);
MD5object *newobj;
if ((newobj = newMD5object(st)) == NULL) {
return NULL;
}
ENTER_HASHLIB(self);
newobj->hash_state = Hacl_Hash_MD5_copy(self->hash_state);
LEAVE_HASHLIB(self);
if (newobj->hash_state == NULL) {
Ty_DECREF(self);
return TyErr_NoMemory();
}
return (TyObject *)newobj;
}
/*[clinic input]
MD5Type.digest
Return the digest value as a bytes object.
[clinic start generated code]*/
static TyObject *
MD5Type_digest_impl(MD5object *self)
/*[clinic end generated code: output=eb691dc4190a07ec input=bc0c4397c2994be6]*/
{
unsigned char digest[MD5_DIGESTSIZE];
ENTER_HASHLIB(self);
Hacl_Hash_MD5_digest(self->hash_state, digest);
LEAVE_HASHLIB(self);
return TyBytes_FromStringAndSize((const char *)digest, MD5_DIGESTSIZE);
}
/*[clinic input]
MD5Type.hexdigest
Return the digest value as a string of hexadecimal digits.
[clinic start generated code]*/
static TyObject *
MD5Type_hexdigest_impl(MD5object *self)
/*[clinic end generated code: output=17badced1f3ac932 input=b60b19de644798dd]*/
{
unsigned char digest[MD5_DIGESTSIZE];
ENTER_HASHLIB(self);
Hacl_Hash_MD5_digest(self->hash_state, digest);
LEAVE_HASHLIB(self);
const char *hexdigits = "0123456789abcdef";
char digest_hex[MD5_DIGESTSIZE * 2];
char *str = digest_hex;
for (size_t i=0; i < MD5_DIGESTSIZE; i++) {
unsigned char byte = digest[i];
*str++ = hexdigits[byte >> 4];
*str++ = hexdigits[byte & 0x0f];
}
return TyUnicode_FromStringAndSize(digest_hex, sizeof(digest_hex));
}
static void
update(Hacl_Hash_MD5_state_t *state, uint8_t *buf, Ty_ssize_t len)
{
/*
* Note: we explicitly ignore the error code on the basis that it would
* take more than 1 billion years to overflow the maximum admissible length
* for MD5 (2^61 - 1).
*/
#if PY_SSIZE_T_MAX > UINT32_MAX
while (len > UINT32_MAX) {
(void)Hacl_Hash_MD5_update(state, buf, UINT32_MAX);
len -= UINT32_MAX;
buf += UINT32_MAX;
}
#endif
/* cast to uint32_t is now safe */
(void)Hacl_Hash_MD5_update(state, buf, (uint32_t)len);
}
/*[clinic input]
MD5Type.update
obj: object
/
Update this hash object's state with the provided string.
[clinic start generated code]*/
static TyObject *
MD5Type_update_impl(MD5object *self, TyObject *obj)
/*[clinic end generated code: output=b0fed9a7ce7ad253 input=6e1efcd9ecf17032]*/
{
Ty_buffer buf;
GET_BUFFER_VIEW_OR_ERROUT(obj, &buf);
if (!self->use_mutex && buf.len >= HASHLIB_GIL_MINSIZE) {
self->use_mutex = true;
}
if (self->use_mutex) {
Ty_BEGIN_ALLOW_THREADS
PyMutex_Lock(&self->mutex);
update(self->hash_state, buf.buf, buf.len);
PyMutex_Unlock(&self->mutex);
Ty_END_ALLOW_THREADS
} else {
update(self->hash_state, buf.buf, buf.len);
}
PyBuffer_Release(&buf);
Py_RETURN_NONE;
}
static TyMethodDef MD5_methods[] = {
MD5TYPE_COPY_METHODDEF
MD5TYPE_DIGEST_METHODDEF
MD5TYPE_HEXDIGEST_METHODDEF
MD5TYPE_UPDATE_METHODDEF
{NULL, NULL} /* sentinel */
};
static TyObject *
MD5_get_block_size(TyObject *Py_UNUSED(self), void *Py_UNUSED(closure))
{
return TyLong_FromLong(MD5_BLOCKSIZE);
}
static TyObject *
MD5_get_name(TyObject *Py_UNUSED(self), void *Py_UNUSED(closure))
{
return TyUnicode_FromStringAndSize("md5", 3);
}
static TyObject *
md5_get_digest_size(TyObject *Py_UNUSED(self), void *Py_UNUSED(closure))
{
return TyLong_FromLong(MD5_DIGESTSIZE);
}
static TyGetSetDef MD5_getseters[] = {
{"block_size", MD5_get_block_size, NULL, NULL, NULL},
{"name", MD5_get_name, NULL, NULL, NULL},
{"digest_size", md5_get_digest_size, NULL, NULL, NULL},
{NULL} /* Sentinel */
};
static TyType_Slot md5_type_slots[] = {
{Ty_tp_dealloc, MD5_dealloc},
{Ty_tp_methods, MD5_methods},
{Ty_tp_getset, MD5_getseters},
{Ty_tp_traverse, MD5_traverse},
{0,0}
};
static TyType_Spec md5_type_spec = {
.name = "_md5.md5",
.basicsize = sizeof(MD5object),
.flags = (Ty_TPFLAGS_DEFAULT | Ty_TPFLAGS_DISALLOW_INSTANTIATION |
Ty_TPFLAGS_IMMUTABLETYPE | Ty_TPFLAGS_HAVE_GC),
.slots = md5_type_slots
};
/* The single module-level function: new() */
/*[clinic input]
_md5.md5
data: object(c_default="NULL") = b''
*
usedforsecurity: bool = True
string as string_obj: object(c_default="NULL") = None
Return a new MD5 hash object; optionally initialized with a string.
[clinic start generated code]*/
static TyObject *
_md5_md5_impl(TyObject *module, TyObject *data, int usedforsecurity,
TyObject *string_obj)
/*[clinic end generated code: output=d45e187d3d16f3a8 input=7ea5c5366dbb44bf]*/
{
TyObject *string;
if (_Ty_hashlib_data_argument(&string, data, string_obj) < 0) {
return NULL;
}
MD5object *new;
Ty_buffer buf;
if (string) {
GET_BUFFER_VIEW_OR_ERROUT(string, &buf);
}
MD5State *st = md5_get_state(module);
if ((new = newMD5object(st)) == NULL) {
if (string) {
PyBuffer_Release(&buf);
}
return NULL;
}
new->hash_state = Hacl_Hash_MD5_malloc();
if (new->hash_state == NULL) {
Ty_DECREF(new);
if (string) {
PyBuffer_Release(&buf);
}
return TyErr_NoMemory();
}
if (string) {
if (buf.len >= HASHLIB_GIL_MINSIZE) {
/* We do not initialize self->lock here as this is the constructor
* where it is not yet possible to have concurrent access. */
Ty_BEGIN_ALLOW_THREADS
update(new->hash_state, buf.buf, buf.len);
Ty_END_ALLOW_THREADS
}
else {
update(new->hash_state, buf.buf, buf.len);
}
PyBuffer_Release(&buf);
}
return (TyObject *)new;
}
/* List of functions exported by this module */
static struct TyMethodDef MD5_functions[] = {
_MD5_MD5_METHODDEF
{NULL, NULL} /* Sentinel */
};
static int
_md5_traverse(TyObject *module, visitproc visit, void *arg)
{
MD5State *state = md5_get_state(module);
Ty_VISIT(state->md5_type);
return 0;
}
static int
_md5_clear(TyObject *module)
{
MD5State *state = md5_get_state(module);
Ty_CLEAR(state->md5_type);
return 0;
}
static void
_md5_free(void *module)
{
_md5_clear((TyObject *)module);
}
/* Initialize this module. */
static int
md5_exec(TyObject *m)
{
MD5State *st = md5_get_state(m);
st->md5_type = (TyTypeObject *)TyType_FromModuleAndSpec(
m, &md5_type_spec, NULL);
if (TyModule_AddObjectRef(m, "MD5Type", (TyObject *)st->md5_type) < 0) {
return -1;
}
if (TyModule_AddIntConstant(m, "_GIL_MINSIZE", HASHLIB_GIL_MINSIZE) < 0) {
return -1;
}
return 0;
}
static PyModuleDef_Slot _md5_slots[] = {
{Ty_mod_exec, md5_exec},
{Ty_mod_multiple_interpreters, Ty_MOD_PER_INTERPRETER_GIL_SUPPORTED},
{Ty_mod_gil, Ty_MOD_GIL_NOT_USED},
{0, NULL}
};
static struct TyModuleDef _md5module = {
PyModuleDef_HEAD_INIT,
.m_name = "_md5",
.m_size = sizeof(MD5State),
.m_methods = MD5_functions,
.m_slots = _md5_slots,
.m_traverse = _md5_traverse,
.m_clear = _md5_clear,
.m_free = _md5_free,
};
PyMODINIT_FUNC
PyInit__md5(void)
{
return PyModuleDef_Init(&_md5module);
}