Patch summary (commentary only; it precedes the first "diff --git" header):
  * pytypes.h: the str(handle) constructor now throws error_already_set when the
    converted pointer is null; in raw_str the null check after PyObject_Str is
    moved inside the "#if PY_MAJOR_VERSION < 3" branch.
  * test_pytypes.cpp: adds a "str_from_handle" binding that calls py::str on a py::handle.
  * test_pytypes.py: adds assertions for str_from_handle, including a malformed
    UTF-8 bytes input (UnicodeDecodeError when env.PY2, "b'\\x80'" otherwise).

diff --git a/include/pybind11/pytypes.h b/include/pybind11/pytypes.h
index bea34cd936..00c791aada 100644
--- a/include/pybind11/pytypes.h
+++ b/include/pybind11/pytypes.h
@@ -920,7 +920,7 @@ class str : public object {
         Return a string representation of the object. This is analogous to
         the ``str()`` function in Python.
     \endrst */
-    explicit str(handle h) : object(raw_str(h.ptr()), stolen_t{}) { }
+    explicit str(handle h) : object(raw_str(h.ptr()), stolen_t{}) { if (!m_ptr) throw error_already_set(); }
 
     operator std::string() const {
         object temp = *this;
@@ -945,8 +945,8 @@ class str : public object {
     /// Return string representation -- always returns a new reference, even if already a str
     static PyObject *raw_str(PyObject *op) {
         PyObject *str_value = PyObject_Str(op);
-        if (!str_value) throw error_already_set();
 #if PY_MAJOR_VERSION < 3
+        if (!str_value) throw error_already_set();
         PyObject *unicode = PyUnicode_FromEncodedObject(str_value, "utf-8", nullptr);
         Py_XDECREF(str_value); str_value = unicode;
 #endif
diff --git a/tests/test_pytypes.cpp b/tests/test_pytypes.cpp
index 925d6ffd27..4ef1b9ff0b 100644
--- a/tests/test_pytypes.cpp
+++ b/tests/test_pytypes.cpp
@@ -80,6 +80,7 @@ TEST_SUBMODULE(pytypes, m) {
     m.def("str_from_bytes", []() { return py::str(py::bytes("boo", 3)); });
     m.def("str_from_object", [](const py::object& obj) { return py::str(obj); });
     m.def("repr_from_object", [](const py::object& obj) { return py::repr(obj); });
+    m.def("str_from_handle", [](py::handle h) { return py::str(h); });
 
     m.def("str_format", []() {
         auto s1 = "{} + {} = {}"_s.format(1, 2, 3);
diff --git a/tests/test_pytypes.py b/tests/test_pytypes.py
index 277c170ebe..33a03c66ca 100644
--- a/tests/test_pytypes.py
+++ b/tests/test_pytypes.py
@@ -109,6 +109,16 @@ def __repr__(self):
     assert s1 == "1 + 2 = 3"
     assert s1 == s2
 
+    assert m.str_from_handle(A()) == "this is a str"
+
+    malformed_utf8 = b"\x80"
+    assert m.str_from_object(malformed_utf8) is malformed_utf8  # Probably surprising.
+    if env.PY2:
+        with pytest.raises(UnicodeDecodeError):
+            m.str_from_handle(malformed_utf8)
+    else:
+        assert m.str_from_handle(malformed_utf8) == "b'\\x80'"
+
 
 def test_bytes(doc):
     assert m.bytes_from_string().decode() == "foo"