| |
| /* Support for dynamic loading of extension modules */ |
| |
| #include "Python.h" |
| #include "pycore_call.h" |
| #include "pycore_import.h" |
| #include "pycore_pyerrors.h" // _PyErr_FormatFromCause() |
| #include "pycore_pystate.h" |
| #include "pycore_runtime.h" |
| |
| /* ./configure sets HAVE_DYNAMIC_LOADING if dynamic loading of modules is |
| supported on this platform. configure will then compile and link in one |
| of the dynload_*.c files, as appropriate. We will call a function in |
| those modules to get a function pointer to the module's init function. |
| */ |
| #ifdef HAVE_DYNAMIC_LOADING |
| |
| #include "pycore_importdl.h" |
| |
| #ifdef MS_WINDOWS |
| extern dl_funcptr _PyImport_FindSharedFuncptrWindows(const char *prefix, |
| const char *shortname, |
| PyObject *pathname, |
| FILE *fp); |
| #else |
| extern dl_funcptr _PyImport_FindSharedFuncptr(const char *prefix, |
| const char *shortname, |
| const char *pathname, FILE *fp); |
| #endif |
| |
| |
| /***********************************/ |
| /* module info to use when loading */ |
| /***********************************/ |
| |
| static const char * const ascii_only_prefix = "PyInit"; |
| static const char * const nonascii_prefix = "PyInitU"; |
| |
| /* Get the variable part of a module's export symbol name. |
| * Returns a bytes instance. For non-ASCII-named modules, the name is |
| * encoded as per PEP 489. |
| * The hook_prefix pointer is set to either ascii_only_prefix or |
| * nonascii_prefix, as appropriate. |
| */ |
| static PyObject * |
| get_encoded_name(PyObject *name, const char **hook_prefix) { |
| PyObject *tmp; |
| PyObject *encoded = NULL; |
| PyObject *modname = NULL; |
| Py_ssize_t name_len, lastdot; |
| |
| /* Get the short name (substring after last dot) */ |
| name_len = PyUnicode_GetLength(name); |
| if (name_len < 0) { |
| return NULL; |
| } |
| lastdot = PyUnicode_FindChar(name, '.', 0, name_len, -1); |
| if (lastdot < -1) { |
| return NULL; |
| } else if (lastdot >= 0) { |
| tmp = PyUnicode_Substring(name, lastdot + 1, name_len); |
| if (tmp == NULL) |
| return NULL; |
| name = tmp; |
| /* "name" now holds a new reference to the substring */ |
| } else { |
| Py_INCREF(name); |
| } |
| |
| /* Encode to ASCII or Punycode, as needed */ |
| encoded = PyUnicode_AsEncodedString(name, "ascii", NULL); |
| if (encoded != NULL) { |
| *hook_prefix = ascii_only_prefix; |
| } else { |
| if (PyErr_ExceptionMatches(PyExc_UnicodeEncodeError)) { |
| PyErr_Clear(); |
| encoded = PyUnicode_AsEncodedString(name, "punycode", NULL); |
| if (encoded == NULL) { |
| goto error; |
| } |
| *hook_prefix = nonascii_prefix; |
| } else { |
| goto error; |
| } |
| } |
| |
| /* Replace '-' by '_' */ |
| modname = _PyObject_CallMethod(encoded, &_Py_ID(replace), "cc", '-', '_'); |
| if (modname == NULL) |
| goto error; |
| |
| Py_DECREF(name); |
| Py_DECREF(encoded); |
| return modname; |
| error: |
| Py_DECREF(name); |
| Py_XDECREF(encoded); |
| return NULL; |
| } |
| |
| void |
| _Py_ext_module_loader_info_clear(struct _Py_ext_module_loader_info *info) |
| { |
| Py_CLEAR(info->filename); |
| #ifndef MS_WINDOWS |
| Py_CLEAR(info->filename_encoded); |
| #endif |
| Py_CLEAR(info->name); |
| Py_CLEAR(info->name_encoded); |
| } |
| |
| int |
| _Py_ext_module_loader_info_init(struct _Py_ext_module_loader_info *p_info, |
| PyObject *name, PyObject *filename, |
| _Py_ext_module_origin origin) |
| { |
| struct _Py_ext_module_loader_info info = { |
| .origin=origin, |
| }; |
| |
| assert(name != NULL); |
| if (!PyUnicode_Check(name)) { |
| PyErr_SetString(PyExc_TypeError, |
| "module name must be a string"); |
| _Py_ext_module_loader_info_clear(&info); |
| return -1; |
| } |
| assert(PyUnicode_GetLength(name) > 0); |
| info.name = Py_NewRef(name); |
| |
| info.name_encoded = get_encoded_name(info.name, &info.hook_prefix); |
| if (info.name_encoded == NULL) { |
| _Py_ext_module_loader_info_clear(&info); |
| return -1; |
| } |
| |
| info.newcontext = PyUnicode_AsUTF8(info.name); |
| if (info.newcontext == NULL) { |
| _Py_ext_module_loader_info_clear(&info); |
| return -1; |
| } |
| |
| if (filename != NULL) { |
| if (!PyUnicode_Check(filename)) { |
| PyErr_SetString(PyExc_TypeError, |
| "module filename must be a string"); |
| _Py_ext_module_loader_info_clear(&info); |
| return -1; |
| } |
| info.filename = Py_NewRef(filename); |
| |
| #ifndef MS_WINDOWS |
| info.filename_encoded = PyUnicode_EncodeFSDefault(info.filename); |
| if (info.filename_encoded == NULL) { |
| _Py_ext_module_loader_info_clear(&info); |
| return -1; |
| } |
| #endif |
| |
| info.path = info.filename; |
| } |
| else { |
| info.path = info.name; |
| } |
| |
| *p_info = info; |
| return 0; |
| } |
| |
| int |
| _Py_ext_module_loader_info_init_for_builtin( |
| struct _Py_ext_module_loader_info *info, |
| PyObject *name) |
| { |
| assert(PyUnicode_Check(name)); |
| assert(PyUnicode_FindChar(name, '.', 0, PyUnicode_GetLength(name), -1) == -1); |
| assert(PyUnicode_GetLength(name) > 0); |
| |
| PyObject *name_encoded = PyUnicode_AsEncodedString(name, "ascii", NULL); |
| if (name_encoded == NULL) { |
| return -1; |
| } |
| |
| *info = (struct _Py_ext_module_loader_info){ |
| .name=Py_NewRef(name), |
| .name_encoded=name_encoded, |
| /* We won't need filename. */ |
| .path=name, |
| .origin=_Py_ext_module_origin_BUILTIN, |
| .hook_prefix=ascii_only_prefix, |
| .newcontext=NULL, |
| }; |
| return 0; |
| } |
| |
| int |
| _Py_ext_module_loader_info_init_for_core( |
| struct _Py_ext_module_loader_info *info, |
| PyObject *name) |
| { |
| if (_Py_ext_module_loader_info_init_for_builtin(info, name) < 0) { |
| return -1; |
| } |
| info->origin = _Py_ext_module_origin_CORE; |
| return 0; |
| } |
| |
| int |
| _Py_ext_module_loader_info_init_from_spec( |
| struct _Py_ext_module_loader_info *p_info, |
| PyObject *spec) |
| { |
| PyObject *name = PyObject_GetAttrString(spec, "name"); |
| if (name == NULL) { |
| return -1; |
| } |
| PyObject *filename = PyObject_GetAttrString(spec, "origin"); |
| if (filename == NULL) { |
| Py_DECREF(name); |
| return -1; |
| } |
| /* We could also accommodate builtin modules here without much trouble. */ |
| _Py_ext_module_origin origin = _Py_ext_module_origin_DYNAMIC; |
| int err = _Py_ext_module_loader_info_init(p_info, name, filename, origin); |
| Py_DECREF(name); |
| Py_DECREF(filename); |
| return err; |
| } |
| |
| |
| /********************************/ |
| /* module init function results */ |
| /********************************/ |
| |
| void |
| _Py_ext_module_loader_result_clear(struct _Py_ext_module_loader_result *res) |
| { |
| /* Instead, the caller should have called |
| * _Py_ext_module_loader_result_apply_error(). */ |
| assert(res->err == NULL); |
| *res = (struct _Py_ext_module_loader_result){0}; |
| } |
| |
| static void |
| _Py_ext_module_loader_result_set_error( |
| struct _Py_ext_module_loader_result *res, |
| enum _Py_ext_module_loader_result_error_kind kind) |
| { |
| #ifndef NDEBUG |
| switch (kind) { |
| case _Py_ext_module_loader_result_EXCEPTION: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_UNREPORTED_EXC: |
| assert(PyErr_Occurred()); |
| break; |
| case _Py_ext_module_loader_result_ERR_MISSING: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_UNINITIALIZED: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_NONASCII_NOT_MULTIPHASE: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_NOT_MODULE: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_MISSING_DEF: |
| assert(!PyErr_Occurred()); |
| break; |
| default: |
| /* We added a new error kind but forgot to add it to this switch. */ |
| assert(0); |
| } |
| #endif |
| |
| assert(res->err == NULL && res->_err.exc == NULL); |
| res->err = &res->_err; |
| *res->err = (struct _Py_ext_module_loader_result_error){ |
| .kind=kind, |
| .exc=PyErr_GetRaisedException(), |
| }; |
| |
| /* For some kinds, we also set/check res->kind. */ |
| switch (kind) { |
| case _Py_ext_module_loader_result_ERR_UNINITIALIZED: |
| assert(res->kind == _Py_ext_module_kind_UNKNOWN); |
| res->kind = _Py_ext_module_kind_INVALID; |
| break; |
| /* None of the rest affect the result kind. */ |
| case _Py_ext_module_loader_result_EXCEPTION: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_MISSING: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_UNREPORTED_EXC: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_NONASCII_NOT_MULTIPHASE: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_NOT_MODULE: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_MISSING_DEF: |
| break; |
| default: |
| /* We added a new error kind but forgot to add it to this switch. */ |
| assert(0); |
| } |
| } |
| |
| void |
| _Py_ext_module_loader_result_apply_error( |
| struct _Py_ext_module_loader_result *res, |
| const char *name) |
| { |
| assert(!PyErr_Occurred()); |
| assert(res->err != NULL && res->err == &res->_err); |
| struct _Py_ext_module_loader_result_error err = *res->err; |
| res->err = NULL; |
| |
| /* We're otherwise done with the result at this point. */ |
| _Py_ext_module_loader_result_clear(res); |
| |
| #ifndef NDEBUG |
| switch (err.kind) { |
| case _Py_ext_module_loader_result_EXCEPTION: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_UNREPORTED_EXC: |
| assert(err.exc != NULL); |
| break; |
| case _Py_ext_module_loader_result_ERR_MISSING: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_UNINITIALIZED: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_NONASCII_NOT_MULTIPHASE: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_NOT_MODULE: /* fall through */ |
| case _Py_ext_module_loader_result_ERR_MISSING_DEF: |
| assert(err.exc == NULL); |
| break; |
| default: |
| /* We added a new error kind but forgot to add it to this switch. */ |
| assert(0); |
| } |
| #endif |
| |
| const char *msg = NULL; |
| switch (err.kind) { |
| case _Py_ext_module_loader_result_EXCEPTION: |
| break; |
| case _Py_ext_module_loader_result_ERR_MISSING: |
| msg = "initialization of %s failed without raising an exception"; |
| break; |
| case _Py_ext_module_loader_result_ERR_UNREPORTED_EXC: |
| msg = "initialization of %s raised unreported exception"; |
| break; |
| case _Py_ext_module_loader_result_ERR_UNINITIALIZED: |
| msg = "init function of %s returned uninitialized object"; |
| break; |
| case _Py_ext_module_loader_result_ERR_NONASCII_NOT_MULTIPHASE: |
| msg = "initialization of %s did not return PyModuleDef"; |
| break; |
| case _Py_ext_module_loader_result_ERR_NOT_MODULE: |
| msg = "initialization of %s did not return an extension module"; |
| break; |
| case _Py_ext_module_loader_result_ERR_MISSING_DEF: |
| msg = "initialization of %s did not return a valid extension module"; |
| break; |
| default: |
| /* We added a new error kind but forgot to add it to this switch. */ |
| assert(0); |
| PyErr_Format(PyExc_SystemError, |
| "loading %s failed due to init function", name); |
| return; |
| } |
| |
| if (err.exc != NULL) { |
| PyErr_SetRaisedException(err.exc); |
| err.exc = NULL; /* PyErr_SetRaisedException() stole our reference. */ |
| if (msg != NULL) { |
| _PyErr_FormatFromCause(PyExc_SystemError, msg, name); |
| } |
| } |
| else { |
| assert(msg != NULL); |
| PyErr_Format(PyExc_SystemError, msg, name); |
| } |
| } |
| |
| |
| /********************************************/ |
| /* getting/running the module init function */ |
| /********************************************/ |
| |
| PyModInitFunction |
| _PyImport_GetModInitFunc(struct _Py_ext_module_loader_info *info, |
| FILE *fp) |
| { |
| const char *name_buf = PyBytes_AS_STRING(info->name_encoded); |
| dl_funcptr exportfunc; |
| #ifdef MS_WINDOWS |
| exportfunc = _PyImport_FindSharedFuncptrWindows( |
| info->hook_prefix, name_buf, info->filename, fp); |
| #else |
| { |
| const char *path_buf = PyBytes_AS_STRING(info->filename_encoded); |
| exportfunc = _PyImport_FindSharedFuncptr( |
| info->hook_prefix, name_buf, path_buf, fp); |
| } |
| #endif |
| |
| if (exportfunc == NULL) { |
| if (!PyErr_Occurred()) { |
| PyObject *msg; |
| msg = PyUnicode_FromFormat( |
| "dynamic module does not define " |
| "module export function (%s_%s)", |
| info->hook_prefix, name_buf); |
| if (msg != NULL) { |
| PyErr_SetImportError(msg, info->name, info->filename); |
| Py_DECREF(msg); |
| } |
| } |
| return NULL; |
| } |
| |
| return (PyModInitFunction)exportfunc; |
| } |
| |
| int |
| _PyImport_RunModInitFunc(PyModInitFunction p0, |
| struct _Py_ext_module_loader_info *info, |
| struct _Py_ext_module_loader_result *p_res) |
| { |
| struct _Py_ext_module_loader_result res = { |
| .kind=_Py_ext_module_kind_UNKNOWN, |
| }; |
| |
| /* Call the module init function. */ |
| |
| /* Package context is needed for single-phase init */ |
| const char *oldcontext = _PyImport_SwapPackageContext(info->newcontext); |
| PyObject *m = p0(); |
| _PyImport_SwapPackageContext(oldcontext); |
| |
| /* Validate the result (and populate "res". */ |
| |
| if (m == NULL) { |
| /* The init func for multi-phase init modules is expected |
| * to return a PyModuleDef after calling PyModuleDef_Init(). |
| * That function never raises an exception nor returns NULL, |
| * so at this point it must be a single-phase init modules. */ |
| res.kind = _Py_ext_module_kind_SINGLEPHASE; |
| if (PyErr_Occurred()) { |
| _Py_ext_module_loader_result_set_error( |
| &res, _Py_ext_module_loader_result_EXCEPTION); |
| } |
| else { |
| _Py_ext_module_loader_result_set_error( |
| &res, _Py_ext_module_loader_result_ERR_MISSING); |
| } |
| goto error; |
| } else if (PyErr_Occurred()) { |
| /* Likewise, we infer that this is a single-phase init module. */ |
| res.kind = _Py_ext_module_kind_SINGLEPHASE; |
| _Py_ext_module_loader_result_set_error( |
| &res, _Py_ext_module_loader_result_ERR_UNREPORTED_EXC); |
| /* We would probably be correct to decref m here, |
| * but we weren't doing so before, |
| * so we stick with doing nothing. */ |
| m = NULL; |
| goto error; |
| } |
| |
| if (Py_IS_TYPE(m, NULL)) { |
| /* This can happen when a PyModuleDef is returned without calling |
| * PyModuleDef_Init on it |
| */ |
| _Py_ext_module_loader_result_set_error( |
| &res, _Py_ext_module_loader_result_ERR_UNINITIALIZED); |
| /* Likewise, decref'ing here makes sense. However, the original |
| * code has a note about "prevent segfault in DECREF", |
| * so we play it safe and leave it alone. */ |
| m = NULL; /* prevent segfault in DECREF */ |
| goto error; |
| } |
| |
| if (PyObject_TypeCheck(m, &PyModuleDef_Type)) { |
| /* multi-phase init */ |
| res.kind = _Py_ext_module_kind_MULTIPHASE; |
| res.def = (PyModuleDef *)m; |
| /* Run PyModule_FromDefAndSpec() to finish loading the module. */ |
| } |
| else if (info->hook_prefix == nonascii_prefix) { |
| /* Non-ASCII is only supported for multi-phase init. */ |
| res.kind = _Py_ext_module_kind_MULTIPHASE; |
| /* Don't allow legacy init for non-ASCII module names. */ |
| _Py_ext_module_loader_result_set_error( |
| &res, _Py_ext_module_loader_result_ERR_NONASCII_NOT_MULTIPHASE); |
| goto error; |
| } |
| else { |
| /* single-phase init (legacy) */ |
| res.kind = _Py_ext_module_kind_SINGLEPHASE; |
| res.module = m; |
| |
| if (!PyModule_Check(m)) { |
| _Py_ext_module_loader_result_set_error( |
| &res, _Py_ext_module_loader_result_ERR_NOT_MODULE); |
| goto error; |
| } |
| |
| res.def = _PyModule_GetDef(m); |
| if (res.def == NULL) { |
| PyErr_Clear(); |
| _Py_ext_module_loader_result_set_error( |
| &res, _Py_ext_module_loader_result_ERR_MISSING_DEF); |
| goto error; |
| } |
| } |
| |
| assert(!PyErr_Occurred()); |
| assert(res.err == NULL); |
| *p_res = res; |
| return 0; |
| |
| error: |
| assert(!PyErr_Occurred()); |
| assert(res.err != NULL); |
| Py_CLEAR(res.module); |
| res.def = NULL; |
| *p_res = res; |
| p_res->err = &p_res->_err; |
| return -1; |
| } |
| |
| #endif /* HAVE_DYNAMIC_LOADING */ |