-
Notifications
You must be signed in to change notification settings - Fork 2.1k
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Call PySys_SetArgv when initializing interpreter. #2341
Changes from 27 commits
1801811
c3e96c2
5145e58
62243f2
32c1445
3ff967d
27ad85e
fb3de9f
3b8438e
0566160
74243c5
c55ab94
fe38a24
3aa548f
1d7f2b3
d5c1df9
aa3b8b8
0627b12
5c38bc5
8358be4
8d64831
3ad3c6d
abc7b38
65881fe
7763c78
6ddc929
ff2976d
912e1c9
52d88c3
1ede69e
318495e
96cb69f
e5c3305
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change | ||||
---|---|---|---|---|---|---|
|
@@ -11,6 +11,8 @@ | |||||
|
||||||
#include "pybind11.h" | ||||||
#include "eval.h" | ||||||
#include <memory> | ||||||
#include <vector> | ||||||
|
||||||
#if defined(PYPY_VERSION) | ||||||
# error Embedding the interpreter is not supported with PyPy | ||||||
|
@@ -83,29 +85,103 @@ struct embedded_module { | |||||
} | ||||||
}; | ||||||
|
||||||
struct wide_char_arg_deleter { | ||||||
void operator()(wchar_t* ptr) const { | ||||||
#if PY_VERSION_HEX >= 0x030500f0 | ||||||
// API docs: https://docs.python.org/3/c-api/sys.html#c.Py_DecodeLocale | ||||||
PyMem_RawFree(ptr); | ||||||
#else | ||||||
delete[] ptr; | ||||||
#endif | ||||||
} | ||||||
}; | ||||||
|
||||||
inline wchar_t* widen_chars(char* safe_arg) { | ||||||
#if PY_VERSION_HEX >= 0x030500f0 | ||||||
wchar_t* widened_arg = Py_DecodeLocale(safe_arg, nullptr); | ||||||
#else | ||||||
wchar_t* widened_arg = nullptr; | ||||||
# if defined(HAVE_BROKEN_MBSTOWCS) && HAVE_BROKEN_MBSTOWCS | ||||||
size_t count = strlen(safe_arg); | ||||||
# else | ||||||
size_t count = mbstowcs(nullptr, safe_arg, 0); | ||||||
# endif | ||||||
if (count != static_cast<size_t>(-1)) { | ||||||
widened_arg = new wchar_t[count + 1]; | ||||||
mbstowcs(widened_arg, safe_arg, count + 1); | ||||||
} | ||||||
#endif | ||||||
return widened_arg; | ||||||
} | ||||||
|
||||||
/// Python 2.x/3.x-compatible version of `PySys_SetArgv` | ||||||
inline void set_interpreter_argv(int argc, char** argv, bool add_program_dir_to_path) { | ||||||
// Before it was special-cased in python 3.8, passing an empty or null argv | ||||||
// caused a segfault, so we have to reimplement the special case ourselves. | ||||||
char** safe_argv = argv; | ||||||
std::unique_ptr<char*[]> argv_guard; | ||||||
std::unique_ptr<char[]> argv_inner_guard; | ||||||
if (nullptr == argv || argc <= 0) { | ||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
I prefer the variable first (such as in the second half of this line, in fact). |
||||||
argv_guard.reset(safe_argv = new char*[1]); | ||||||
argv_inner_guard.reset(safe_argv[0] = new char[1]); | ||||||
safe_argv[0][0] = '\0'; | ||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Does this function really modify the You can always be more strict; if you have a |
||||||
argc = 1; | ||||||
} | ||||||
#if PY_MAJOR_VERSION >= 3 | ||||||
auto argv_size = static_cast<size_t>(argc); | ||||||
// SetArgv* on python 3 takes wchar_t, so we have to convert. | ||||||
std::unique_ptr<wchar_t*[]> widened_argv(new wchar_t*[argv_size]); | ||||||
Skylion007 marked this conversation as resolved.
Show resolved
Hide resolved
|
||||||
std::vector< std::unique_ptr<wchar_t[], wide_char_arg_deleter> > widened_argv_entries; | ||||||
Skylion007 marked this conversation as resolved.
Show resolved
Hide resolved
|
||||||
for (size_t ii = 0; ii < argv_size; ++ii) { | ||||||
widened_argv_entries.emplace_back(widen_chars(safe_argv[ii])); | ||||||
if (!widened_argv_entries.back()) { | ||||||
// A null here indicates a character-encoding failure or the python | ||||||
// interpreter out of memory. Give up. | ||||||
return; | ||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Should we raise an exception here, instead of silently doing nothing? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I think silently doing nothing is actually OK here. Consider:
That said, I'm not married to the decision. It just seemed like a reasonable fallback to revert to the old behavior. |
||||||
} | ||||||
widened_argv[ii] = widened_argv_entries.back().get(); | ||||||
} | ||||||
|
||||||
auto pysys_argv = widened_argv.get(); | ||||||
#else | ||||||
// python 2.x | ||||||
auto pysys_argv = safe_argv; | ||||||
#endif | ||||||
|
||||||
PySys_SetArgvEx(argc, pysys_argv, static_cast<int>(add_program_dir_to_path)); | ||||||
} | ||||||
|
||||||
PYBIND11_NAMESPACE_END(detail) | ||||||
|
||||||
/** \rst | ||||||
Initialize the Python interpreter. No other pybind11 or CPython API functions can be | ||||||
called before this is done; with the exception of `PYBIND11_EMBEDDED_MODULE`. The | ||||||
optional parameter can be used to skip the registration of signal handlers (see the | ||||||
`Python documentation`_ for details). Calling this function again after the interpreter | ||||||
has already been initialized is a fatal error. | ||||||
optional `init_signal_handlers` parameter can be used to skip the registration of | ||||||
signal handlers (see the `Python documentation`_ for details). Calling this function | ||||||
again after the interpreter has already been initialized is a fatal error. | ||||||
|
||||||
If initializing the Python interpreter fails, then the program is terminated. (This | ||||||
is controlled by the CPython runtime and is an exception to pybind11's normal behavior | ||||||
of throwing exceptions on errors.) | ||||||
|
||||||
The remaining optional parameters, `argc`, `argv`, and `add_program_dir_to_path` are | ||||||
used to populate ``sys.argv`` and ``sys.path``. | ||||||
See the |PySys_SetArgvEx documentation|_ for details. | ||||||
|
||||||
.. _Python documentation: https://docs.python.org/3/c-api/init.html#c.Py_InitializeEx | ||||||
.. |PySys_SetArgvEx documentation| replace:: ``PySys_SetArgvEx`` documentation | ||||||
.. _PySys_SetArgvEx documentation: https://docs.python.org/3/c-api/init.html#c.PySys_SetArgvEx | ||||||
\endrst */ | ||||||
inline void initialize_interpreter(bool init_signal_handlers = true) { | ||||||
inline void initialize_interpreter(bool init_signal_handlers = true, | ||||||
int argc = 0, | ||||||
char** argv = nullptr, | ||||||
bool add_program_dir_to_path = true) { | ||||||
if (Py_IsInitialized() != 0) | ||||||
pybind11_fail("The interpreter is already running"); | ||||||
|
||||||
Py_InitializeEx(init_signal_handlers ? 1 : 0); | ||||||
|
||||||
// Make .py files in the working directory available by default | ||||||
module_::import("sys").attr("path").cast<list>().append("."); | ||||||
detail::set_interpreter_argv(argc, argv, add_program_dir_to_path); | ||||||
} | ||||||
|
||||||
/** \rst | ||||||
|
@@ -167,6 +243,8 @@ inline void finalize_interpreter() { | |||||
Scope guard version of `initialize_interpreter` and `finalize_interpreter`. | ||||||
This a move-only guard and only a single instance can exist. | ||||||
|
||||||
See `initialize_interpreter` for a discussion of its constructor arguments. | ||||||
|
||||||
.. code-block:: cpp | ||||||
|
||||||
#include <pybind11/embed.h> | ||||||
|
@@ -178,8 +256,11 @@ inline void finalize_interpreter() { | |||||
\endrst */ | ||||||
class scoped_interpreter { | ||||||
public: | ||||||
scoped_interpreter(bool init_signal_handlers = true) { | ||||||
initialize_interpreter(init_signal_handlers); | ||||||
scoped_interpreter(bool init_signal_handlers = true, | ||||||
int argc = 0, | ||||||
char** argv = nullptr, | ||||||
bool add_program_dir_to_path = true) { | ||||||
initialize_interpreter(init_signal_handlers, argc, argv, add_program_dir_to_path); | ||||||
} | ||||||
|
||||||
scoped_interpreter(const scoped_interpreter &) = delete; | ||||||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Nit: shouldn't we add an debug assert that argc >= 0? We are casting a signed int to an unsigned size_t
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I think it's covered by the
argc <= 0
below, combined withargc = 1
.