15ffd83dbSDimitry Andric //===-- PythonDataObjects.cpp ---------------------------------------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 9480093f4SDimitry Andric #include "lldb/Host/Config.h" 100b57cec5SDimitry Andric 11480093f4SDimitry Andric #if LLDB_ENABLE_PYTHON 120b57cec5SDimitry Andric 130b57cec5SDimitry Andric #include "PythonDataObjects.h" 140b57cec5SDimitry Andric #include "ScriptInterpreterPython.h" 150b57cec5SDimitry Andric 160b57cec5SDimitry Andric #include "lldb/Host/File.h" 170b57cec5SDimitry Andric #include "lldb/Host/FileSystem.h" 180b57cec5SDimitry Andric #include "lldb/Interpreter/ScriptInterpreter.h" 199dba64beSDimitry Andric #include "lldb/Utility/Log.h" 200b57cec5SDimitry Andric #include "lldb/Utility/Stream.h" 210b57cec5SDimitry Andric 220b57cec5SDimitry Andric #include "llvm/ADT/StringSwitch.h" 239dba64beSDimitry Andric #include "llvm/Support/Casting.h" 240b57cec5SDimitry Andric #include "llvm/Support/ConvertUTF.h" 250b57cec5SDimitry Andric #include "llvm/Support/Errno.h" 260b57cec5SDimitry Andric 27fe6060f1SDimitry Andric #include <cstdio> 280b57cec5SDimitry Andric 290b57cec5SDimitry Andric using namespace lldb_private; 300b57cec5SDimitry Andric using namespace lldb; 319dba64beSDimitry Andric using namespace lldb_private::python; 329dba64beSDimitry Andric using llvm::cantFail; 339dba64beSDimitry Andric using llvm::Error; 349dba64beSDimitry Andric using llvm::Expected; 359dba64beSDimitry Andric using llvm::Twine; 360b57cec5SDimitry Andric 379dba64beSDimitry Andric template <> Expected<bool> python::As<bool>(Expected<PythonObject> &&obj) { 389dba64beSDimitry Andric if (!obj) 399dba64beSDimitry Andric return obj.takeError(); 409dba64beSDimitry Andric return obj.get().IsTrue(); 419dba64beSDimitry Andric } 429dba64beSDimitry Andric 439dba64beSDimitry Andric template <> 449dba64beSDimitry Andric Expected<long long> python::As<long long>(Expected<PythonObject> &&obj) { 459dba64beSDimitry Andric if (!obj) 469dba64beSDimitry Andric return obj.takeError(); 475ffd83dbSDimitry Andric return obj->AsLongLong(); 485ffd83dbSDimitry Andric } 495ffd83dbSDimitry Andric 505ffd83dbSDimitry Andric template <> 515ffd83dbSDimitry Andric Expected<unsigned long long> 525ffd83dbSDimitry Andric python::As<unsigned long long>(Expected<PythonObject> &&obj) { 535ffd83dbSDimitry Andric if (!obj) 545ffd83dbSDimitry Andric return obj.takeError(); 555ffd83dbSDimitry Andric return obj->AsUnsignedLongLong(); 569dba64beSDimitry Andric } 579dba64beSDimitry Andric 589dba64beSDimitry Andric template <> 599dba64beSDimitry Andric Expected<std::string> python::As<std::string>(Expected<PythonObject> &&obj) { 609dba64beSDimitry Andric if (!obj) 619dba64beSDimitry Andric return obj.takeError(); 629dba64beSDimitry Andric PyObject *str_obj = PyObject_Str(obj.get().get()); 639dba64beSDimitry Andric if (!obj) 649dba64beSDimitry Andric return llvm::make_error<PythonException>(); 659dba64beSDimitry Andric auto str = Take<PythonString>(str_obj); 669dba64beSDimitry Andric auto utf8 = str.AsUTF8(); 679dba64beSDimitry Andric if (!utf8) 689dba64beSDimitry Andric return utf8.takeError(); 695ffd83dbSDimitry Andric return std::string(utf8.get()); 705ffd83dbSDimitry Andric } 715ffd83dbSDimitry Andric 72*04eeddc0SDimitry Andric static bool python_is_finalizing() { 73*04eeddc0SDimitry Andric #if PY_MAJOR_VERSION == 2 74*04eeddc0SDimitry Andric return false; 75*04eeddc0SDimitry Andric #elif PY_MAJOR_VERSION == 3 && PY_MINOR_VERSION < 7 76*04eeddc0SDimitry Andric return _Py_Finalizing != nullptr; 77*04eeddc0SDimitry Andric #else 78*04eeddc0SDimitry Andric return _Py_IsFinalizing(); 79*04eeddc0SDimitry Andric #endif 80*04eeddc0SDimitry Andric } 81*04eeddc0SDimitry Andric 82*04eeddc0SDimitry Andric void PythonObject::Reset() { 83*04eeddc0SDimitry Andric if (m_py_obj && Py_IsInitialized()) { 84*04eeddc0SDimitry Andric if (python_is_finalizing()) { 85*04eeddc0SDimitry Andric // Leak m_py_obj rather than crashing the process. 86*04eeddc0SDimitry Andric // https://docs.python.org/3/c-api/init.html#c.PyGILState_Ensure 87*04eeddc0SDimitry Andric } else { 88*04eeddc0SDimitry Andric PyGILState_STATE state = PyGILState_Ensure(); 89*04eeddc0SDimitry Andric Py_DECREF(m_py_obj); 90*04eeddc0SDimitry Andric PyGILState_Release(state); 91*04eeddc0SDimitry Andric } 92*04eeddc0SDimitry Andric } 93*04eeddc0SDimitry Andric m_py_obj = nullptr; 94*04eeddc0SDimitry Andric } 95*04eeddc0SDimitry Andric 965ffd83dbSDimitry Andric Expected<long long> PythonObject::AsLongLong() const { 975ffd83dbSDimitry Andric if (!m_py_obj) 985ffd83dbSDimitry Andric return nullDeref(); 995ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3 1005ffd83dbSDimitry Andric if (!PyLong_Check(m_py_obj)) { 1015ffd83dbSDimitry Andric PythonInteger i(PyRefType::Borrowed, m_py_obj); 1025ffd83dbSDimitry Andric return i.AsLongLong(); 1035ffd83dbSDimitry Andric } 1045ffd83dbSDimitry Andric #endif 1055ffd83dbSDimitry Andric assert(!PyErr_Occurred()); 1065ffd83dbSDimitry Andric long long r = PyLong_AsLongLong(m_py_obj); 1075ffd83dbSDimitry Andric if (PyErr_Occurred()) 1085ffd83dbSDimitry Andric return exception(); 1095ffd83dbSDimitry Andric return r; 1105ffd83dbSDimitry Andric } 1115ffd83dbSDimitry Andric 1125ffd83dbSDimitry Andric Expected<long long> PythonObject::AsUnsignedLongLong() const { 1135ffd83dbSDimitry Andric if (!m_py_obj) 1145ffd83dbSDimitry Andric return nullDeref(); 1155ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3 1165ffd83dbSDimitry Andric if (!PyLong_Check(m_py_obj)) { 1175ffd83dbSDimitry Andric PythonInteger i(PyRefType::Borrowed, m_py_obj); 1185ffd83dbSDimitry Andric return i.AsUnsignedLongLong(); 1195ffd83dbSDimitry Andric } 1205ffd83dbSDimitry Andric #endif 1215ffd83dbSDimitry Andric assert(!PyErr_Occurred()); 1225ffd83dbSDimitry Andric long long r = PyLong_AsUnsignedLongLong(m_py_obj); 1235ffd83dbSDimitry Andric if (PyErr_Occurred()) 1245ffd83dbSDimitry Andric return exception(); 1255ffd83dbSDimitry Andric return r; 1265ffd83dbSDimitry Andric } 1275ffd83dbSDimitry Andric 1285ffd83dbSDimitry Andric // wraps on overflow, instead of raising an error. 1295ffd83dbSDimitry Andric Expected<unsigned long long> PythonObject::AsModuloUnsignedLongLong() const { 1305ffd83dbSDimitry Andric if (!m_py_obj) 1315ffd83dbSDimitry Andric return nullDeref(); 1325ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3 1335ffd83dbSDimitry Andric if (!PyLong_Check(m_py_obj)) { 1345ffd83dbSDimitry Andric PythonInteger i(PyRefType::Borrowed, m_py_obj); 1355ffd83dbSDimitry Andric return i.AsModuloUnsignedLongLong(); 1365ffd83dbSDimitry Andric } 1375ffd83dbSDimitry Andric #endif 1385ffd83dbSDimitry Andric assert(!PyErr_Occurred()); 1395ffd83dbSDimitry Andric unsigned long long r = PyLong_AsUnsignedLongLongMask(m_py_obj); 1405ffd83dbSDimitry Andric if (PyErr_Occurred()) 1415ffd83dbSDimitry Andric return exception(); 1425ffd83dbSDimitry Andric return r; 1439dba64beSDimitry Andric } 1449dba64beSDimitry Andric 1459dba64beSDimitry Andric void StructuredPythonObject::Serialize(llvm::json::OStream &s) const { 1469dba64beSDimitry Andric s.value(llvm::formatv("Python Obj: {0:X}", GetValue()).str()); 1470b57cec5SDimitry Andric } 1480b57cec5SDimitry Andric 1490b57cec5SDimitry Andric // PythonObject 1500b57cec5SDimitry Andric 1510b57cec5SDimitry Andric void PythonObject::Dump(Stream &strm) const { 1520b57cec5SDimitry Andric if (m_py_obj) { 1530b57cec5SDimitry Andric FILE *file = llvm::sys::RetryAfterSignal(nullptr, ::tmpfile); 1540b57cec5SDimitry Andric if (file) { 1550b57cec5SDimitry Andric ::PyObject_Print(m_py_obj, file, 0); 1560b57cec5SDimitry Andric const long length = ftell(file); 1570b57cec5SDimitry Andric if (length) { 1580b57cec5SDimitry Andric ::rewind(file); 1590b57cec5SDimitry Andric std::vector<char> file_contents(length, '\0'); 1600b57cec5SDimitry Andric const size_t length_read = 1610b57cec5SDimitry Andric ::fread(file_contents.data(), 1, file_contents.size(), file); 1620b57cec5SDimitry Andric if (length_read > 0) 1630b57cec5SDimitry Andric strm.Write(file_contents.data(), length_read); 1640b57cec5SDimitry Andric } 1650b57cec5SDimitry Andric ::fclose(file); 1660b57cec5SDimitry Andric } 1670b57cec5SDimitry Andric } else 1680b57cec5SDimitry Andric strm.PutCString("NULL"); 1690b57cec5SDimitry Andric } 1700b57cec5SDimitry Andric 1710b57cec5SDimitry Andric PyObjectType PythonObject::GetObjectType() const { 1720b57cec5SDimitry Andric if (!IsAllocated()) 1730b57cec5SDimitry Andric return PyObjectType::None; 1740b57cec5SDimitry Andric 1750b57cec5SDimitry Andric if (PythonModule::Check(m_py_obj)) 1760b57cec5SDimitry Andric return PyObjectType::Module; 1770b57cec5SDimitry Andric if (PythonList::Check(m_py_obj)) 1780b57cec5SDimitry Andric return PyObjectType::List; 1790b57cec5SDimitry Andric if (PythonTuple::Check(m_py_obj)) 1800b57cec5SDimitry Andric return PyObjectType::Tuple; 1810b57cec5SDimitry Andric if (PythonDictionary::Check(m_py_obj)) 1820b57cec5SDimitry Andric return PyObjectType::Dictionary; 1830b57cec5SDimitry Andric if (PythonString::Check(m_py_obj)) 1840b57cec5SDimitry Andric return PyObjectType::String; 1850b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 1860b57cec5SDimitry Andric if (PythonBytes::Check(m_py_obj)) 1870b57cec5SDimitry Andric return PyObjectType::Bytes; 1880b57cec5SDimitry Andric #endif 1890b57cec5SDimitry Andric if (PythonByteArray::Check(m_py_obj)) 1900b57cec5SDimitry Andric return PyObjectType::ByteArray; 1910b57cec5SDimitry Andric if (PythonBoolean::Check(m_py_obj)) 1920b57cec5SDimitry Andric return PyObjectType::Boolean; 1930b57cec5SDimitry Andric if (PythonInteger::Check(m_py_obj)) 1940b57cec5SDimitry Andric return PyObjectType::Integer; 1950b57cec5SDimitry Andric if (PythonFile::Check(m_py_obj)) 1960b57cec5SDimitry Andric return PyObjectType::File; 1970b57cec5SDimitry Andric if (PythonCallable::Check(m_py_obj)) 1980b57cec5SDimitry Andric return PyObjectType::Callable; 1990b57cec5SDimitry Andric return PyObjectType::Unknown; 2000b57cec5SDimitry Andric } 2010b57cec5SDimitry Andric 2020b57cec5SDimitry Andric PythonString PythonObject::Repr() const { 2030b57cec5SDimitry Andric if (!m_py_obj) 2040b57cec5SDimitry Andric return PythonString(); 2050b57cec5SDimitry Andric PyObject *repr = PyObject_Repr(m_py_obj); 2060b57cec5SDimitry Andric if (!repr) 2070b57cec5SDimitry Andric return PythonString(); 2080b57cec5SDimitry Andric return PythonString(PyRefType::Owned, repr); 2090b57cec5SDimitry Andric } 2100b57cec5SDimitry Andric 2110b57cec5SDimitry Andric PythonString PythonObject::Str() const { 2120b57cec5SDimitry Andric if (!m_py_obj) 2130b57cec5SDimitry Andric return PythonString(); 2140b57cec5SDimitry Andric PyObject *str = PyObject_Str(m_py_obj); 2150b57cec5SDimitry Andric if (!str) 2160b57cec5SDimitry Andric return PythonString(); 2170b57cec5SDimitry Andric return PythonString(PyRefType::Owned, str); 2180b57cec5SDimitry Andric } 2190b57cec5SDimitry Andric 2200b57cec5SDimitry Andric PythonObject 2210b57cec5SDimitry Andric PythonObject::ResolveNameWithDictionary(llvm::StringRef name, 2220b57cec5SDimitry Andric const PythonDictionary &dict) { 2230b57cec5SDimitry Andric size_t dot_pos = name.find('.'); 2240b57cec5SDimitry Andric llvm::StringRef piece = name.substr(0, dot_pos); 2250b57cec5SDimitry Andric PythonObject result = dict.GetItemForKey(PythonString(piece)); 2260b57cec5SDimitry Andric if (dot_pos == llvm::StringRef::npos) { 2270b57cec5SDimitry Andric // There was no dot, we're done. 2280b57cec5SDimitry Andric return result; 2290b57cec5SDimitry Andric } 2300b57cec5SDimitry Andric 2310b57cec5SDimitry Andric // There was a dot. The remaining portion of the name should be looked up in 2320b57cec5SDimitry Andric // the context of the object that was found in the dictionary. 2330b57cec5SDimitry Andric return result.ResolveName(name.substr(dot_pos + 1)); 2340b57cec5SDimitry Andric } 2350b57cec5SDimitry Andric 2360b57cec5SDimitry Andric PythonObject PythonObject::ResolveName(llvm::StringRef name) const { 2370b57cec5SDimitry Andric // Resolve the name in the context of the specified object. If, for example, 2380b57cec5SDimitry Andric // `this` refers to a PyModule, then this will look for `name` in this 2390b57cec5SDimitry Andric // module. If `this` refers to a PyType, then it will resolve `name` as an 2400b57cec5SDimitry Andric // attribute of that type. If `this` refers to an instance of an object, 2410b57cec5SDimitry Andric // then it will resolve `name` as the value of the specified field. 2420b57cec5SDimitry Andric // 2430b57cec5SDimitry Andric // This function handles dotted names so that, for example, if `m_py_obj` 2440b57cec5SDimitry Andric // refers to the `sys` module, and `name` == "path.append", then it will find 2450b57cec5SDimitry Andric // the function `sys.path.append`. 2460b57cec5SDimitry Andric 2470b57cec5SDimitry Andric size_t dot_pos = name.find('.'); 2480b57cec5SDimitry Andric if (dot_pos == llvm::StringRef::npos) { 2490b57cec5SDimitry Andric // No dots in the name, we should be able to find the value immediately as 2500b57cec5SDimitry Andric // an attribute of `m_py_obj`. 2510b57cec5SDimitry Andric return GetAttributeValue(name); 2520b57cec5SDimitry Andric } 2530b57cec5SDimitry Andric 2540b57cec5SDimitry Andric // Look up the first piece of the name, and resolve the rest as a child of 2550b57cec5SDimitry Andric // that. 2560b57cec5SDimitry Andric PythonObject parent = ResolveName(name.substr(0, dot_pos)); 2570b57cec5SDimitry Andric if (!parent.IsAllocated()) 2580b57cec5SDimitry Andric return PythonObject(); 2590b57cec5SDimitry Andric 2600b57cec5SDimitry Andric // Tail recursion.. should be optimized by the compiler 2610b57cec5SDimitry Andric return parent.ResolveName(name.substr(dot_pos + 1)); 2620b57cec5SDimitry Andric } 2630b57cec5SDimitry Andric 2640b57cec5SDimitry Andric bool PythonObject::HasAttribute(llvm::StringRef attr) const { 2650b57cec5SDimitry Andric if (!IsValid()) 2660b57cec5SDimitry Andric return false; 2670b57cec5SDimitry Andric PythonString py_attr(attr); 2680b57cec5SDimitry Andric return !!PyObject_HasAttr(m_py_obj, py_attr.get()); 2690b57cec5SDimitry Andric } 2700b57cec5SDimitry Andric 2710b57cec5SDimitry Andric PythonObject PythonObject::GetAttributeValue(llvm::StringRef attr) const { 2720b57cec5SDimitry Andric if (!IsValid()) 2730b57cec5SDimitry Andric return PythonObject(); 2740b57cec5SDimitry Andric 2750b57cec5SDimitry Andric PythonString py_attr(attr); 2760b57cec5SDimitry Andric if (!PyObject_HasAttr(m_py_obj, py_attr.get())) 2770b57cec5SDimitry Andric return PythonObject(); 2780b57cec5SDimitry Andric 2790b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, 2800b57cec5SDimitry Andric PyObject_GetAttr(m_py_obj, py_attr.get())); 2810b57cec5SDimitry Andric } 2820b57cec5SDimitry Andric 2830b57cec5SDimitry Andric StructuredData::ObjectSP PythonObject::CreateStructuredObject() const { 284*04eeddc0SDimitry Andric #if PY_MAJOR_VERSION >= 3 285*04eeddc0SDimitry Andric assert(PyGILState_Check()); 286*04eeddc0SDimitry Andric #endif 2870b57cec5SDimitry Andric switch (GetObjectType()) { 2880b57cec5SDimitry Andric case PyObjectType::Dictionary: 2890b57cec5SDimitry Andric return PythonDictionary(PyRefType::Borrowed, m_py_obj) 2900b57cec5SDimitry Andric .CreateStructuredDictionary(); 2910b57cec5SDimitry Andric case PyObjectType::Boolean: 2920b57cec5SDimitry Andric return PythonBoolean(PyRefType::Borrowed, m_py_obj) 2930b57cec5SDimitry Andric .CreateStructuredBoolean(); 2940b57cec5SDimitry Andric case PyObjectType::Integer: 2950b57cec5SDimitry Andric return PythonInteger(PyRefType::Borrowed, m_py_obj) 2960b57cec5SDimitry Andric .CreateStructuredInteger(); 2970b57cec5SDimitry Andric case PyObjectType::List: 2980b57cec5SDimitry Andric return PythonList(PyRefType::Borrowed, m_py_obj).CreateStructuredArray(); 2990b57cec5SDimitry Andric case PyObjectType::String: 3000b57cec5SDimitry Andric return PythonString(PyRefType::Borrowed, m_py_obj).CreateStructuredString(); 3010b57cec5SDimitry Andric case PyObjectType::Bytes: 3020b57cec5SDimitry Andric return PythonBytes(PyRefType::Borrowed, m_py_obj).CreateStructuredString(); 3030b57cec5SDimitry Andric case PyObjectType::ByteArray: 3040b57cec5SDimitry Andric return PythonByteArray(PyRefType::Borrowed, m_py_obj) 3050b57cec5SDimitry Andric .CreateStructuredString(); 3060b57cec5SDimitry Andric case PyObjectType::None: 3070b57cec5SDimitry Andric return StructuredData::ObjectSP(); 3080b57cec5SDimitry Andric default: 309*04eeddc0SDimitry Andric return StructuredData::ObjectSP(new StructuredPythonObject( 310*04eeddc0SDimitry Andric PythonObject(PyRefType::Borrowed, m_py_obj))); 3110b57cec5SDimitry Andric } 3120b57cec5SDimitry Andric } 3130b57cec5SDimitry Andric 3140b57cec5SDimitry Andric // PythonString 3150b57cec5SDimitry Andric 3169dba64beSDimitry Andric PythonBytes::PythonBytes(llvm::ArrayRef<uint8_t> bytes) { SetBytes(bytes); } 3170b57cec5SDimitry Andric 3189dba64beSDimitry Andric PythonBytes::PythonBytes(const uint8_t *bytes, size_t length) { 3190b57cec5SDimitry Andric SetBytes(llvm::ArrayRef<uint8_t>(bytes, length)); 3200b57cec5SDimitry Andric } 3210b57cec5SDimitry Andric 3220b57cec5SDimitry Andric bool PythonBytes::Check(PyObject *py_obj) { 3230b57cec5SDimitry Andric if (!py_obj) 3240b57cec5SDimitry Andric return false; 3250b57cec5SDimitry Andric return PyBytes_Check(py_obj); 3260b57cec5SDimitry Andric } 3270b57cec5SDimitry Andric 3280b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> PythonBytes::GetBytes() const { 3290b57cec5SDimitry Andric if (!IsValid()) 3300b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(); 3310b57cec5SDimitry Andric 3320b57cec5SDimitry Andric Py_ssize_t size; 3330b57cec5SDimitry Andric char *c; 3340b57cec5SDimitry Andric 3350b57cec5SDimitry Andric PyBytes_AsStringAndSize(m_py_obj, &c, &size); 3360b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(reinterpret_cast<uint8_t *>(c), size); 3370b57cec5SDimitry Andric } 3380b57cec5SDimitry Andric 3390b57cec5SDimitry Andric size_t PythonBytes::GetSize() const { 3400b57cec5SDimitry Andric if (!IsValid()) 3410b57cec5SDimitry Andric return 0; 3420b57cec5SDimitry Andric return PyBytes_Size(m_py_obj); 3430b57cec5SDimitry Andric } 3440b57cec5SDimitry Andric 3450b57cec5SDimitry Andric void PythonBytes::SetBytes(llvm::ArrayRef<uint8_t> bytes) { 3460b57cec5SDimitry Andric const char *data = reinterpret_cast<const char *>(bytes.data()); 3479dba64beSDimitry Andric *this = Take<PythonBytes>(PyBytes_FromStringAndSize(data, bytes.size())); 3480b57cec5SDimitry Andric } 3490b57cec5SDimitry Andric 3500b57cec5SDimitry Andric StructuredData::StringSP PythonBytes::CreateStructuredString() const { 3510b57cec5SDimitry Andric StructuredData::StringSP result(new StructuredData::String); 3520b57cec5SDimitry Andric Py_ssize_t size; 3530b57cec5SDimitry Andric char *c; 3540b57cec5SDimitry Andric PyBytes_AsStringAndSize(m_py_obj, &c, &size); 3550b57cec5SDimitry Andric result->SetValue(std::string(c, size)); 3560b57cec5SDimitry Andric return result; 3570b57cec5SDimitry Andric } 3580b57cec5SDimitry Andric 3590b57cec5SDimitry Andric PythonByteArray::PythonByteArray(llvm::ArrayRef<uint8_t> bytes) 3600b57cec5SDimitry Andric : PythonByteArray(bytes.data(), bytes.size()) {} 3610b57cec5SDimitry Andric 3620b57cec5SDimitry Andric PythonByteArray::PythonByteArray(const uint8_t *bytes, size_t length) { 3630b57cec5SDimitry Andric const char *str = reinterpret_cast<const char *>(bytes); 3649dba64beSDimitry Andric *this = Take<PythonByteArray>(PyByteArray_FromStringAndSize(str, length)); 3650b57cec5SDimitry Andric } 3660b57cec5SDimitry Andric 3670b57cec5SDimitry Andric bool PythonByteArray::Check(PyObject *py_obj) { 3680b57cec5SDimitry Andric if (!py_obj) 3690b57cec5SDimitry Andric return false; 3700b57cec5SDimitry Andric return PyByteArray_Check(py_obj); 3710b57cec5SDimitry Andric } 3720b57cec5SDimitry Andric 3730b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> PythonByteArray::GetBytes() const { 3740b57cec5SDimitry Andric if (!IsValid()) 3750b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(); 3760b57cec5SDimitry Andric 3770b57cec5SDimitry Andric char *c = PyByteArray_AsString(m_py_obj); 3780b57cec5SDimitry Andric size_t size = GetSize(); 3790b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(reinterpret_cast<uint8_t *>(c), size); 3800b57cec5SDimitry Andric } 3810b57cec5SDimitry Andric 3820b57cec5SDimitry Andric size_t PythonByteArray::GetSize() const { 3830b57cec5SDimitry Andric if (!IsValid()) 3840b57cec5SDimitry Andric return 0; 3850b57cec5SDimitry Andric 3860b57cec5SDimitry Andric return PyByteArray_Size(m_py_obj); 3870b57cec5SDimitry Andric } 3880b57cec5SDimitry Andric 3890b57cec5SDimitry Andric StructuredData::StringSP PythonByteArray::CreateStructuredString() const { 3900b57cec5SDimitry Andric StructuredData::StringSP result(new StructuredData::String); 3910b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> bytes = GetBytes(); 3920b57cec5SDimitry Andric const char *str = reinterpret_cast<const char *>(bytes.data()); 3930b57cec5SDimitry Andric result->SetValue(std::string(str, bytes.size())); 3940b57cec5SDimitry Andric return result; 3950b57cec5SDimitry Andric } 3960b57cec5SDimitry Andric 3970b57cec5SDimitry Andric // PythonString 3980b57cec5SDimitry Andric 3999dba64beSDimitry Andric Expected<PythonString> PythonString::FromUTF8(llvm::StringRef string) { 4009dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 4019dba64beSDimitry Andric PyObject *str = PyUnicode_FromStringAndSize(string.data(), string.size()); 4029dba64beSDimitry Andric #else 4039dba64beSDimitry Andric PyObject *str = PyString_FromStringAndSize(string.data(), string.size()); 4049dba64beSDimitry Andric #endif 4059dba64beSDimitry Andric if (!str) 4069dba64beSDimitry Andric return llvm::make_error<PythonException>(); 4079dba64beSDimitry Andric return Take<PythonString>(str); 4080b57cec5SDimitry Andric } 4090b57cec5SDimitry Andric 4109dba64beSDimitry Andric PythonString::PythonString(llvm::StringRef string) { SetString(string); } 4110b57cec5SDimitry Andric 4120b57cec5SDimitry Andric bool PythonString::Check(PyObject *py_obj) { 4130b57cec5SDimitry Andric if (!py_obj) 4140b57cec5SDimitry Andric return false; 4150b57cec5SDimitry Andric 4160b57cec5SDimitry Andric if (PyUnicode_Check(py_obj)) 4170b57cec5SDimitry Andric return true; 4180b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 4190b57cec5SDimitry Andric if (PyString_Check(py_obj)) 4200b57cec5SDimitry Andric return true; 4210b57cec5SDimitry Andric #endif 4220b57cec5SDimitry Andric return false; 4230b57cec5SDimitry Andric } 4240b57cec5SDimitry Andric 4259dba64beSDimitry Andric void PythonString::Convert(PyRefType &type, PyObject *&py_obj) { 4260b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 4270b57cec5SDimitry Andric // In Python 2, Don't store PyUnicode objects directly, because we need 4280b57cec5SDimitry Andric // access to their underlying character buffers which Python 2 doesn't 4290b57cec5SDimitry Andric // provide. 4309dba64beSDimitry Andric if (PyUnicode_Check(py_obj)) { 4319dba64beSDimitry Andric PyObject *s = PyUnicode_AsUTF8String(py_obj); 4329dba64beSDimitry Andric if (s == nullptr) { 4339dba64beSDimitry Andric PyErr_Clear(); 4349dba64beSDimitry Andric if (type == PyRefType::Owned) 4359dba64beSDimitry Andric Py_DECREF(py_obj); 4369dba64beSDimitry Andric return; 4379dba64beSDimitry Andric } 4389dba64beSDimitry Andric if (type == PyRefType::Owned) 4399dba64beSDimitry Andric Py_DECREF(py_obj); 4409dba64beSDimitry Andric else 4419dba64beSDimitry Andric type = PyRefType::Owned; 4429dba64beSDimitry Andric py_obj = s; 4439dba64beSDimitry Andric } 4440b57cec5SDimitry Andric #endif 4450b57cec5SDimitry Andric } 4460b57cec5SDimitry Andric 4470b57cec5SDimitry Andric llvm::StringRef PythonString::GetString() const { 4489dba64beSDimitry Andric auto s = AsUTF8(); 4499dba64beSDimitry Andric if (!s) { 4509dba64beSDimitry Andric llvm::consumeError(s.takeError()); 4519dba64beSDimitry Andric return llvm::StringRef(""); 4529dba64beSDimitry Andric } 4539dba64beSDimitry Andric return s.get(); 4549dba64beSDimitry Andric } 4559dba64beSDimitry Andric 4569dba64beSDimitry Andric Expected<llvm::StringRef> PythonString::AsUTF8() const { 4570b57cec5SDimitry Andric if (!IsValid()) 4589dba64beSDimitry Andric return nullDeref(); 4590b57cec5SDimitry Andric 4600b57cec5SDimitry Andric Py_ssize_t size; 4610b57cec5SDimitry Andric const char *data; 4620b57cec5SDimitry Andric 4630b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 4640b57cec5SDimitry Andric data = PyUnicode_AsUTF8AndSize(m_py_obj, &size); 4650b57cec5SDimitry Andric #else 4669dba64beSDimitry Andric char *c = NULL; 4679dba64beSDimitry Andric int r = PyString_AsStringAndSize(m_py_obj, &c, &size); 4689dba64beSDimitry Andric if (r < 0) 4699dba64beSDimitry Andric c = NULL; 4700b57cec5SDimitry Andric data = c; 4710b57cec5SDimitry Andric #endif 4729dba64beSDimitry Andric 4739dba64beSDimitry Andric if (!data) 4749dba64beSDimitry Andric return exception(); 4759dba64beSDimitry Andric 4760b57cec5SDimitry Andric return llvm::StringRef(data, size); 4770b57cec5SDimitry Andric } 4780b57cec5SDimitry Andric 4790b57cec5SDimitry Andric size_t PythonString::GetSize() const { 4800b57cec5SDimitry Andric if (IsValid()) { 4810b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 482e8d8bef9SDimitry Andric #if PY_MINOR_VERSION >= 3 483e8d8bef9SDimitry Andric return PyUnicode_GetLength(m_py_obj); 484e8d8bef9SDimitry Andric #else 4850b57cec5SDimitry Andric return PyUnicode_GetSize(m_py_obj); 486e8d8bef9SDimitry Andric #endif 4870b57cec5SDimitry Andric #else 4880b57cec5SDimitry Andric return PyString_Size(m_py_obj); 4890b57cec5SDimitry Andric #endif 4900b57cec5SDimitry Andric } 4910b57cec5SDimitry Andric return 0; 4920b57cec5SDimitry Andric } 4930b57cec5SDimitry Andric 4940b57cec5SDimitry Andric void PythonString::SetString(llvm::StringRef string) { 4959dba64beSDimitry Andric auto s = FromUTF8(string); 4969dba64beSDimitry Andric if (!s) { 4979dba64beSDimitry Andric llvm::consumeError(s.takeError()); 4989dba64beSDimitry Andric Reset(); 4999dba64beSDimitry Andric } else { 5009dba64beSDimitry Andric *this = std::move(s.get()); 5019dba64beSDimitry Andric } 5020b57cec5SDimitry Andric } 5030b57cec5SDimitry Andric 5040b57cec5SDimitry Andric StructuredData::StringSP PythonString::CreateStructuredString() const { 5050b57cec5SDimitry Andric StructuredData::StringSP result(new StructuredData::String); 5060b57cec5SDimitry Andric result->SetValue(GetString()); 5070b57cec5SDimitry Andric return result; 5080b57cec5SDimitry Andric } 5090b57cec5SDimitry Andric 5100b57cec5SDimitry Andric // PythonInteger 5110b57cec5SDimitry Andric 5129dba64beSDimitry Andric PythonInteger::PythonInteger(int64_t value) { SetInteger(value); } 5130b57cec5SDimitry Andric 5140b57cec5SDimitry Andric bool PythonInteger::Check(PyObject *py_obj) { 5150b57cec5SDimitry Andric if (!py_obj) 5160b57cec5SDimitry Andric return false; 5170b57cec5SDimitry Andric 5180b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 5190b57cec5SDimitry Andric // Python 3 does not have PyInt_Check. There is only one type of integral 5200b57cec5SDimitry Andric // value, long. 5210b57cec5SDimitry Andric return PyLong_Check(py_obj); 5220b57cec5SDimitry Andric #else 5230b57cec5SDimitry Andric return PyLong_Check(py_obj) || PyInt_Check(py_obj); 5240b57cec5SDimitry Andric #endif 5250b57cec5SDimitry Andric } 5260b57cec5SDimitry Andric 5279dba64beSDimitry Andric void PythonInteger::Convert(PyRefType &type, PyObject *&py_obj) { 5280b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 5290b57cec5SDimitry Andric // Always store this as a PyLong, which makes interoperability between Python 5300b57cec5SDimitry Andric // 2.x and Python 3.x easier. This is only necessary in 2.x, since 3.x 5310b57cec5SDimitry Andric // doesn't even have a PyInt. 5320b57cec5SDimitry Andric if (PyInt_Check(py_obj)) { 5330b57cec5SDimitry Andric // Since we converted the original object to a different type, the new 5340b57cec5SDimitry Andric // object is an owned object regardless of the ownership semantics 5350b57cec5SDimitry Andric // requested by the user. 5369dba64beSDimitry Andric long long value = PyInt_AsLong(py_obj); 5379dba64beSDimitry Andric PyObject *l = nullptr; 5389dba64beSDimitry Andric if (!PyErr_Occurred()) 5399dba64beSDimitry Andric l = PyLong_FromLongLong(value); 5409dba64beSDimitry Andric if (l == nullptr) { 5419dba64beSDimitry Andric PyErr_Clear(); 5429dba64beSDimitry Andric if (type == PyRefType::Owned) 5439dba64beSDimitry Andric Py_DECREF(py_obj); 5449dba64beSDimitry Andric return; 5459dba64beSDimitry Andric } 5469dba64beSDimitry Andric if (type == PyRefType::Owned) 5479dba64beSDimitry Andric Py_DECREF(py_obj); 5489dba64beSDimitry Andric else 5499dba64beSDimitry Andric type = PyRefType::Owned; 5509dba64beSDimitry Andric py_obj = l; 5510b57cec5SDimitry Andric } 5520b57cec5SDimitry Andric #endif 5530b57cec5SDimitry Andric } 5540b57cec5SDimitry Andric 5550b57cec5SDimitry Andric void PythonInteger::SetInteger(int64_t value) { 5569dba64beSDimitry Andric *this = Take<PythonInteger>(PyLong_FromLongLong(value)); 5570b57cec5SDimitry Andric } 5580b57cec5SDimitry Andric 5590b57cec5SDimitry Andric StructuredData::IntegerSP PythonInteger::CreateStructuredInteger() const { 5600b57cec5SDimitry Andric StructuredData::IntegerSP result(new StructuredData::Integer); 5615ffd83dbSDimitry Andric // FIXME this is really not ideal. Errors are silently converted to 0 5625ffd83dbSDimitry Andric // and overflows are silently wrapped. But we'd need larger changes 5635ffd83dbSDimitry Andric // to StructuredData to fix it, so that's how it is for now. 5645ffd83dbSDimitry Andric llvm::Expected<unsigned long long> value = AsModuloUnsignedLongLong(); 5655ffd83dbSDimitry Andric if (!value) { 5665ffd83dbSDimitry Andric llvm::consumeError(value.takeError()); 5675ffd83dbSDimitry Andric result->SetValue(0); 5685ffd83dbSDimitry Andric } else { 5695ffd83dbSDimitry Andric result->SetValue(value.get()); 5705ffd83dbSDimitry Andric } 5710b57cec5SDimitry Andric return result; 5720b57cec5SDimitry Andric } 5730b57cec5SDimitry Andric 5740b57cec5SDimitry Andric // PythonBoolean 5750b57cec5SDimitry Andric 5760b57cec5SDimitry Andric PythonBoolean::PythonBoolean(bool value) { 5770b57cec5SDimitry Andric SetValue(value); 5780b57cec5SDimitry Andric } 5790b57cec5SDimitry Andric 5800b57cec5SDimitry Andric bool PythonBoolean::Check(PyObject *py_obj) { 5810b57cec5SDimitry Andric return py_obj ? PyBool_Check(py_obj) : false; 5820b57cec5SDimitry Andric } 5830b57cec5SDimitry Andric 5840b57cec5SDimitry Andric bool PythonBoolean::GetValue() const { 5850b57cec5SDimitry Andric return m_py_obj ? PyObject_IsTrue(m_py_obj) : false; 5860b57cec5SDimitry Andric } 5870b57cec5SDimitry Andric 5880b57cec5SDimitry Andric void PythonBoolean::SetValue(bool value) { 5899dba64beSDimitry Andric *this = Take<PythonBoolean>(PyBool_FromLong(value)); 5900b57cec5SDimitry Andric } 5910b57cec5SDimitry Andric 5920b57cec5SDimitry Andric StructuredData::BooleanSP PythonBoolean::CreateStructuredBoolean() const { 5930b57cec5SDimitry Andric StructuredData::BooleanSP result(new StructuredData::Boolean); 5940b57cec5SDimitry Andric result->SetValue(GetValue()); 5950b57cec5SDimitry Andric return result; 5960b57cec5SDimitry Andric } 5970b57cec5SDimitry Andric 5980b57cec5SDimitry Andric // PythonList 5990b57cec5SDimitry Andric 6009dba64beSDimitry Andric PythonList::PythonList(PyInitialValue value) { 6010b57cec5SDimitry Andric if (value == PyInitialValue::Empty) 6029dba64beSDimitry Andric *this = Take<PythonList>(PyList_New(0)); 6030b57cec5SDimitry Andric } 6040b57cec5SDimitry Andric 6059dba64beSDimitry Andric PythonList::PythonList(int list_size) { 6069dba64beSDimitry Andric *this = Take<PythonList>(PyList_New(list_size)); 6070b57cec5SDimitry Andric } 6080b57cec5SDimitry Andric 6090b57cec5SDimitry Andric bool PythonList::Check(PyObject *py_obj) { 6100b57cec5SDimitry Andric if (!py_obj) 6110b57cec5SDimitry Andric return false; 6120b57cec5SDimitry Andric return PyList_Check(py_obj); 6130b57cec5SDimitry Andric } 6140b57cec5SDimitry Andric 6150b57cec5SDimitry Andric uint32_t PythonList::GetSize() const { 6160b57cec5SDimitry Andric if (IsValid()) 6170b57cec5SDimitry Andric return PyList_GET_SIZE(m_py_obj); 6180b57cec5SDimitry Andric return 0; 6190b57cec5SDimitry Andric } 6200b57cec5SDimitry Andric 6210b57cec5SDimitry Andric PythonObject PythonList::GetItemAtIndex(uint32_t index) const { 6220b57cec5SDimitry Andric if (IsValid()) 6230b57cec5SDimitry Andric return PythonObject(PyRefType::Borrowed, PyList_GetItem(m_py_obj, index)); 6240b57cec5SDimitry Andric return PythonObject(); 6250b57cec5SDimitry Andric } 6260b57cec5SDimitry Andric 6270b57cec5SDimitry Andric void PythonList::SetItemAtIndex(uint32_t index, const PythonObject &object) { 6280b57cec5SDimitry Andric if (IsAllocated() && object.IsValid()) { 6290b57cec5SDimitry Andric // PyList_SetItem is documented to "steal" a reference, so we need to 6300b57cec5SDimitry Andric // convert it to an owned reference by incrementing it. 6310b57cec5SDimitry Andric Py_INCREF(object.get()); 6320b57cec5SDimitry Andric PyList_SetItem(m_py_obj, index, object.get()); 6330b57cec5SDimitry Andric } 6340b57cec5SDimitry Andric } 6350b57cec5SDimitry Andric 6360b57cec5SDimitry Andric void PythonList::AppendItem(const PythonObject &object) { 6370b57cec5SDimitry Andric if (IsAllocated() && object.IsValid()) { 6380b57cec5SDimitry Andric // `PyList_Append` does *not* steal a reference, so do not call `Py_INCREF` 6390b57cec5SDimitry Andric // here like we do with `PyList_SetItem`. 6400b57cec5SDimitry Andric PyList_Append(m_py_obj, object.get()); 6410b57cec5SDimitry Andric } 6420b57cec5SDimitry Andric } 6430b57cec5SDimitry Andric 6440b57cec5SDimitry Andric StructuredData::ArraySP PythonList::CreateStructuredArray() const { 6450b57cec5SDimitry Andric StructuredData::ArraySP result(new StructuredData::Array); 6460b57cec5SDimitry Andric uint32_t count = GetSize(); 6470b57cec5SDimitry Andric for (uint32_t i = 0; i < count; ++i) { 6480b57cec5SDimitry Andric PythonObject obj = GetItemAtIndex(i); 6490b57cec5SDimitry Andric result->AddItem(obj.CreateStructuredObject()); 6500b57cec5SDimitry Andric } 6510b57cec5SDimitry Andric return result; 6520b57cec5SDimitry Andric } 6530b57cec5SDimitry Andric 6540b57cec5SDimitry Andric // PythonTuple 6550b57cec5SDimitry Andric 6569dba64beSDimitry Andric PythonTuple::PythonTuple(PyInitialValue value) { 6570b57cec5SDimitry Andric if (value == PyInitialValue::Empty) 6589dba64beSDimitry Andric *this = Take<PythonTuple>(PyTuple_New(0)); 6590b57cec5SDimitry Andric } 6600b57cec5SDimitry Andric 6619dba64beSDimitry Andric PythonTuple::PythonTuple(int tuple_size) { 6629dba64beSDimitry Andric *this = Take<PythonTuple>(PyTuple_New(tuple_size)); 6630b57cec5SDimitry Andric } 6640b57cec5SDimitry Andric 6650b57cec5SDimitry Andric PythonTuple::PythonTuple(std::initializer_list<PythonObject> objects) { 6660b57cec5SDimitry Andric m_py_obj = PyTuple_New(objects.size()); 6670b57cec5SDimitry Andric 6680b57cec5SDimitry Andric uint32_t idx = 0; 6690b57cec5SDimitry Andric for (auto object : objects) { 6700b57cec5SDimitry Andric if (object.IsValid()) 6710b57cec5SDimitry Andric SetItemAtIndex(idx, object); 6720b57cec5SDimitry Andric idx++; 6730b57cec5SDimitry Andric } 6740b57cec5SDimitry Andric } 6750b57cec5SDimitry Andric 6760b57cec5SDimitry Andric PythonTuple::PythonTuple(std::initializer_list<PyObject *> objects) { 6770b57cec5SDimitry Andric m_py_obj = PyTuple_New(objects.size()); 6780b57cec5SDimitry Andric 6790b57cec5SDimitry Andric uint32_t idx = 0; 6800b57cec5SDimitry Andric for (auto py_object : objects) { 6810b57cec5SDimitry Andric PythonObject object(PyRefType::Borrowed, py_object); 6820b57cec5SDimitry Andric if (object.IsValid()) 6830b57cec5SDimitry Andric SetItemAtIndex(idx, object); 6840b57cec5SDimitry Andric idx++; 6850b57cec5SDimitry Andric } 6860b57cec5SDimitry Andric } 6870b57cec5SDimitry Andric 6880b57cec5SDimitry Andric bool PythonTuple::Check(PyObject *py_obj) { 6890b57cec5SDimitry Andric if (!py_obj) 6900b57cec5SDimitry Andric return false; 6910b57cec5SDimitry Andric return PyTuple_Check(py_obj); 6920b57cec5SDimitry Andric } 6930b57cec5SDimitry Andric 6940b57cec5SDimitry Andric uint32_t PythonTuple::GetSize() const { 6950b57cec5SDimitry Andric if (IsValid()) 6960b57cec5SDimitry Andric return PyTuple_GET_SIZE(m_py_obj); 6970b57cec5SDimitry Andric return 0; 6980b57cec5SDimitry Andric } 6990b57cec5SDimitry Andric 7000b57cec5SDimitry Andric PythonObject PythonTuple::GetItemAtIndex(uint32_t index) const { 7010b57cec5SDimitry Andric if (IsValid()) 7020b57cec5SDimitry Andric return PythonObject(PyRefType::Borrowed, PyTuple_GetItem(m_py_obj, index)); 7030b57cec5SDimitry Andric return PythonObject(); 7040b57cec5SDimitry Andric } 7050b57cec5SDimitry Andric 7060b57cec5SDimitry Andric void PythonTuple::SetItemAtIndex(uint32_t index, const PythonObject &object) { 7070b57cec5SDimitry Andric if (IsAllocated() && object.IsValid()) { 7080b57cec5SDimitry Andric // PyTuple_SetItem is documented to "steal" a reference, so we need to 7090b57cec5SDimitry Andric // convert it to an owned reference by incrementing it. 7100b57cec5SDimitry Andric Py_INCREF(object.get()); 7110b57cec5SDimitry Andric PyTuple_SetItem(m_py_obj, index, object.get()); 7120b57cec5SDimitry Andric } 7130b57cec5SDimitry Andric } 7140b57cec5SDimitry Andric 7150b57cec5SDimitry Andric StructuredData::ArraySP PythonTuple::CreateStructuredArray() const { 7160b57cec5SDimitry Andric StructuredData::ArraySP result(new StructuredData::Array); 7170b57cec5SDimitry Andric uint32_t count = GetSize(); 7180b57cec5SDimitry Andric for (uint32_t i = 0; i < count; ++i) { 7190b57cec5SDimitry Andric PythonObject obj = GetItemAtIndex(i); 7200b57cec5SDimitry Andric result->AddItem(obj.CreateStructuredObject()); 7210b57cec5SDimitry Andric } 7220b57cec5SDimitry Andric return result; 7230b57cec5SDimitry Andric } 7240b57cec5SDimitry Andric 7250b57cec5SDimitry Andric // PythonDictionary 7260b57cec5SDimitry Andric 7279dba64beSDimitry Andric PythonDictionary::PythonDictionary(PyInitialValue value) { 7280b57cec5SDimitry Andric if (value == PyInitialValue::Empty) 7299dba64beSDimitry Andric *this = Take<PythonDictionary>(PyDict_New()); 7300b57cec5SDimitry Andric } 7310b57cec5SDimitry Andric 7320b57cec5SDimitry Andric bool PythonDictionary::Check(PyObject *py_obj) { 7330b57cec5SDimitry Andric if (!py_obj) 7340b57cec5SDimitry Andric return false; 7350b57cec5SDimitry Andric 7360b57cec5SDimitry Andric return PyDict_Check(py_obj); 7370b57cec5SDimitry Andric } 7380b57cec5SDimitry Andric 7390b57cec5SDimitry Andric uint32_t PythonDictionary::GetSize() const { 7400b57cec5SDimitry Andric if (IsValid()) 7410b57cec5SDimitry Andric return PyDict_Size(m_py_obj); 7420b57cec5SDimitry Andric return 0; 7430b57cec5SDimitry Andric } 7440b57cec5SDimitry Andric 7450b57cec5SDimitry Andric PythonList PythonDictionary::GetKeys() const { 7460b57cec5SDimitry Andric if (IsValid()) 7470b57cec5SDimitry Andric return PythonList(PyRefType::Owned, PyDict_Keys(m_py_obj)); 7480b57cec5SDimitry Andric return PythonList(PyInitialValue::Invalid); 7490b57cec5SDimitry Andric } 7500b57cec5SDimitry Andric 7510b57cec5SDimitry Andric PythonObject PythonDictionary::GetItemForKey(const PythonObject &key) const { 7529dba64beSDimitry Andric auto item = GetItem(key); 7539dba64beSDimitry Andric if (!item) { 7549dba64beSDimitry Andric llvm::consumeError(item.takeError()); 7550b57cec5SDimitry Andric return PythonObject(); 7560b57cec5SDimitry Andric } 7579dba64beSDimitry Andric return std::move(item.get()); 7589dba64beSDimitry Andric } 7599dba64beSDimitry Andric 7609dba64beSDimitry Andric Expected<PythonObject> 7619dba64beSDimitry Andric PythonDictionary::GetItem(const PythonObject &key) const { 7629dba64beSDimitry Andric if (!IsValid()) 7639dba64beSDimitry Andric return nullDeref(); 7649dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 7659dba64beSDimitry Andric PyObject *o = PyDict_GetItemWithError(m_py_obj, key.get()); 7669dba64beSDimitry Andric if (PyErr_Occurred()) 7679dba64beSDimitry Andric return exception(); 7689dba64beSDimitry Andric #else 7699dba64beSDimitry Andric PyObject *o = PyDict_GetItem(m_py_obj, key.get()); 7709dba64beSDimitry Andric #endif 7719dba64beSDimitry Andric if (!o) 7729dba64beSDimitry Andric return keyError(); 7739dba64beSDimitry Andric return Retain<PythonObject>(o); 7749dba64beSDimitry Andric } 7759dba64beSDimitry Andric 7769dba64beSDimitry Andric Expected<PythonObject> PythonDictionary::GetItem(const Twine &key) const { 7779dba64beSDimitry Andric if (!IsValid()) 7789dba64beSDimitry Andric return nullDeref(); 7799dba64beSDimitry Andric PyObject *o = PyDict_GetItemString(m_py_obj, NullTerminated(key)); 7809dba64beSDimitry Andric if (PyErr_Occurred()) 7819dba64beSDimitry Andric return exception(); 7829dba64beSDimitry Andric if (!o) 7839dba64beSDimitry Andric return keyError(); 7849dba64beSDimitry Andric return Retain<PythonObject>(o); 7859dba64beSDimitry Andric } 7869dba64beSDimitry Andric 7879dba64beSDimitry Andric Error PythonDictionary::SetItem(const PythonObject &key, 7889dba64beSDimitry Andric const PythonObject &value) const { 7899dba64beSDimitry Andric if (!IsValid() || !value.IsValid()) 7909dba64beSDimitry Andric return nullDeref(); 7919dba64beSDimitry Andric int r = PyDict_SetItem(m_py_obj, key.get(), value.get()); 7929dba64beSDimitry Andric if (r < 0) 7939dba64beSDimitry Andric return exception(); 7949dba64beSDimitry Andric return Error::success(); 7959dba64beSDimitry Andric } 7969dba64beSDimitry Andric 7979dba64beSDimitry Andric Error PythonDictionary::SetItem(const Twine &key, 7989dba64beSDimitry Andric const PythonObject &value) const { 7999dba64beSDimitry Andric if (!IsValid() || !value.IsValid()) 8009dba64beSDimitry Andric return nullDeref(); 8019dba64beSDimitry Andric int r = PyDict_SetItemString(m_py_obj, NullTerminated(key), value.get()); 8029dba64beSDimitry Andric if (r < 0) 8039dba64beSDimitry Andric return exception(); 8049dba64beSDimitry Andric return Error::success(); 8059dba64beSDimitry Andric } 8060b57cec5SDimitry Andric 8070b57cec5SDimitry Andric void PythonDictionary::SetItemForKey(const PythonObject &key, 8080b57cec5SDimitry Andric const PythonObject &value) { 8099dba64beSDimitry Andric Error error = SetItem(key, value); 8109dba64beSDimitry Andric if (error) 8119dba64beSDimitry Andric llvm::consumeError(std::move(error)); 8120b57cec5SDimitry Andric } 8130b57cec5SDimitry Andric 8140b57cec5SDimitry Andric StructuredData::DictionarySP 8150b57cec5SDimitry Andric PythonDictionary::CreateStructuredDictionary() const { 8160b57cec5SDimitry Andric StructuredData::DictionarySP result(new StructuredData::Dictionary); 8170b57cec5SDimitry Andric PythonList keys(GetKeys()); 8180b57cec5SDimitry Andric uint32_t num_keys = keys.GetSize(); 8190b57cec5SDimitry Andric for (uint32_t i = 0; i < num_keys; ++i) { 8200b57cec5SDimitry Andric PythonObject key = keys.GetItemAtIndex(i); 8210b57cec5SDimitry Andric PythonObject value = GetItemForKey(key); 8220b57cec5SDimitry Andric StructuredData::ObjectSP structured_value = value.CreateStructuredObject(); 8230b57cec5SDimitry Andric result->AddItem(key.Str().GetString(), structured_value); 8240b57cec5SDimitry Andric } 8250b57cec5SDimitry Andric return result; 8260b57cec5SDimitry Andric } 8270b57cec5SDimitry Andric 8280b57cec5SDimitry Andric PythonModule PythonModule::BuiltinsModule() { 8290b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 8300b57cec5SDimitry Andric return AddModule("builtins"); 8310b57cec5SDimitry Andric #else 8320b57cec5SDimitry Andric return AddModule("__builtin__"); 8330b57cec5SDimitry Andric #endif 8340b57cec5SDimitry Andric } 8350b57cec5SDimitry Andric 8360b57cec5SDimitry Andric PythonModule PythonModule::MainModule() { return AddModule("__main__"); } 8370b57cec5SDimitry Andric 8380b57cec5SDimitry Andric PythonModule PythonModule::AddModule(llvm::StringRef module) { 8390b57cec5SDimitry Andric std::string str = module.str(); 8400b57cec5SDimitry Andric return PythonModule(PyRefType::Borrowed, PyImport_AddModule(str.c_str())); 8410b57cec5SDimitry Andric } 8420b57cec5SDimitry Andric 8439dba64beSDimitry Andric Expected<PythonModule> PythonModule::Import(const Twine &name) { 8449dba64beSDimitry Andric PyObject *mod = PyImport_ImportModule(NullTerminated(name)); 8459dba64beSDimitry Andric if (!mod) 8469dba64beSDimitry Andric return exception(); 8479dba64beSDimitry Andric return Take<PythonModule>(mod); 8489dba64beSDimitry Andric } 8499dba64beSDimitry Andric 8509dba64beSDimitry Andric Expected<PythonObject> PythonModule::Get(const Twine &name) { 8519dba64beSDimitry Andric if (!IsValid()) 8529dba64beSDimitry Andric return nullDeref(); 8539dba64beSDimitry Andric PyObject *dict = PyModule_GetDict(m_py_obj); 8549dba64beSDimitry Andric if (!dict) 8559dba64beSDimitry Andric return exception(); 8569dba64beSDimitry Andric PyObject *item = PyDict_GetItemString(dict, NullTerminated(name)); 8579dba64beSDimitry Andric if (!item) 8589dba64beSDimitry Andric return exception(); 8599dba64beSDimitry Andric return Retain<PythonObject>(item); 8600b57cec5SDimitry Andric } 8610b57cec5SDimitry Andric 8620b57cec5SDimitry Andric bool PythonModule::Check(PyObject *py_obj) { 8630b57cec5SDimitry Andric if (!py_obj) 8640b57cec5SDimitry Andric return false; 8650b57cec5SDimitry Andric 8660b57cec5SDimitry Andric return PyModule_Check(py_obj); 8670b57cec5SDimitry Andric } 8680b57cec5SDimitry Andric 8690b57cec5SDimitry Andric PythonDictionary PythonModule::GetDictionary() const { 8709dba64beSDimitry Andric if (!IsValid()) 8719dba64beSDimitry Andric return PythonDictionary(); 8729dba64beSDimitry Andric return Retain<PythonDictionary>(PyModule_GetDict(m_py_obj)); 8730b57cec5SDimitry Andric } 8740b57cec5SDimitry Andric 8750b57cec5SDimitry Andric bool PythonCallable::Check(PyObject *py_obj) { 8760b57cec5SDimitry Andric if (!py_obj) 8770b57cec5SDimitry Andric return false; 8780b57cec5SDimitry Andric 8790b57cec5SDimitry Andric return PyCallable_Check(py_obj); 8800b57cec5SDimitry Andric } 8810b57cec5SDimitry Andric 8829dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 && PY_MINOR_VERSION >= 3 8839dba64beSDimitry Andric static const char get_arg_info_script[] = R"( 8849dba64beSDimitry Andric from inspect import signature, Parameter, ismethod 8859dba64beSDimitry Andric from collections import namedtuple 886480093f4SDimitry Andric ArgInfo = namedtuple('ArgInfo', ['count', 'has_varargs']) 8879dba64beSDimitry Andric def main(f): 8889dba64beSDimitry Andric count = 0 8899dba64beSDimitry Andric varargs = False 8909dba64beSDimitry Andric for parameter in signature(f).parameters.values(): 8919dba64beSDimitry Andric kind = parameter.kind 8929dba64beSDimitry Andric if kind in (Parameter.POSITIONAL_ONLY, 8939dba64beSDimitry Andric Parameter.POSITIONAL_OR_KEYWORD): 8949dba64beSDimitry Andric count += 1 8959dba64beSDimitry Andric elif kind == Parameter.VAR_POSITIONAL: 8969dba64beSDimitry Andric varargs = True 8979dba64beSDimitry Andric elif kind in (Parameter.KEYWORD_ONLY, 8989dba64beSDimitry Andric Parameter.VAR_KEYWORD): 8999dba64beSDimitry Andric pass 9009dba64beSDimitry Andric else: 9019dba64beSDimitry Andric raise Exception(f'unknown parameter kind: {kind}') 902480093f4SDimitry Andric return ArgInfo(count, varargs) 9039dba64beSDimitry Andric )"; 9049dba64beSDimitry Andric #endif 9059dba64beSDimitry Andric 9069dba64beSDimitry Andric Expected<PythonCallable::ArgInfo> PythonCallable::GetArgInfo() const { 9079dba64beSDimitry Andric ArgInfo result = {}; 9089dba64beSDimitry Andric if (!IsValid()) 9099dba64beSDimitry Andric return nullDeref(); 9109dba64beSDimitry Andric 9119dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 && PY_MINOR_VERSION >= 3 9129dba64beSDimitry Andric 9139dba64beSDimitry Andric // no need to synchronize access to this global, we already have the GIL 9149dba64beSDimitry Andric static PythonScript get_arg_info(get_arg_info_script); 9159dba64beSDimitry Andric Expected<PythonObject> pyarginfo = get_arg_info(*this); 9169dba64beSDimitry Andric if (!pyarginfo) 9179dba64beSDimitry Andric return pyarginfo.takeError(); 918480093f4SDimitry Andric long long count = 919480093f4SDimitry Andric cantFail(As<long long>(pyarginfo.get().GetAttribute("count"))); 920480093f4SDimitry Andric bool has_varargs = 9219dba64beSDimitry Andric cantFail(As<bool>(pyarginfo.get().GetAttribute("has_varargs"))); 922480093f4SDimitry Andric result.max_positional_args = has_varargs ? ArgInfo::UNBOUNDED : count; 9239dba64beSDimitry Andric 9249dba64beSDimitry Andric #else 925480093f4SDimitry Andric PyObject *py_func_obj; 9269dba64beSDimitry Andric bool is_bound_method = false; 927480093f4SDimitry Andric bool is_class = false; 928480093f4SDimitry Andric 929480093f4SDimitry Andric if (PyType_Check(m_py_obj) || PyClass_Check(m_py_obj)) { 930480093f4SDimitry Andric auto init = GetAttribute("__init__"); 931480093f4SDimitry Andric if (!init) 932480093f4SDimitry Andric return init.takeError(); 933480093f4SDimitry Andric py_func_obj = init.get().get(); 934480093f4SDimitry Andric is_class = true; 935480093f4SDimitry Andric } else { 936480093f4SDimitry Andric py_func_obj = m_py_obj; 937480093f4SDimitry Andric } 938480093f4SDimitry Andric 9390b57cec5SDimitry Andric if (PyMethod_Check(py_func_obj)) { 9400b57cec5SDimitry Andric py_func_obj = PyMethod_GET_FUNCTION(py_func_obj); 9410b57cec5SDimitry Andric PythonObject im_self = GetAttributeValue("im_self"); 9420b57cec5SDimitry Andric if (im_self.IsValid() && !im_self.IsNone()) 9439dba64beSDimitry Andric is_bound_method = true; 9440b57cec5SDimitry Andric } else { 9450b57cec5SDimitry Andric // see if this is a callable object with an __call__ method 9460b57cec5SDimitry Andric if (!PyFunction_Check(py_func_obj)) { 9470b57cec5SDimitry Andric PythonObject __call__ = GetAttributeValue("__call__"); 9480b57cec5SDimitry Andric if (__call__.IsValid()) { 9490b57cec5SDimitry Andric auto __callable__ = __call__.AsType<PythonCallable>(); 9500b57cec5SDimitry Andric if (__callable__.IsValid()) { 9510b57cec5SDimitry Andric py_func_obj = PyMethod_GET_FUNCTION(__callable__.get()); 9529dba64beSDimitry Andric PythonObject im_self = __callable__.GetAttributeValue("im_self"); 9530b57cec5SDimitry Andric if (im_self.IsValid() && !im_self.IsNone()) 9549dba64beSDimitry Andric is_bound_method = true; 9550b57cec5SDimitry Andric } 9560b57cec5SDimitry Andric } 9570b57cec5SDimitry Andric } 9580b57cec5SDimitry Andric } 9590b57cec5SDimitry Andric 9600b57cec5SDimitry Andric if (!py_func_obj) 9610b57cec5SDimitry Andric return result; 9620b57cec5SDimitry Andric 9630b57cec5SDimitry Andric PyCodeObject *code = (PyCodeObject *)PyFunction_GET_CODE(py_func_obj); 9640b57cec5SDimitry Andric if (!code) 9650b57cec5SDimitry Andric return result; 9660b57cec5SDimitry Andric 967480093f4SDimitry Andric auto count = code->co_argcount; 968480093f4SDimitry Andric bool has_varargs = !!(code->co_flags & CO_VARARGS); 969480093f4SDimitry Andric result.max_positional_args = 970480093f4SDimitry Andric has_varargs ? ArgInfo::UNBOUNDED 971480093f4SDimitry Andric : (count - (int)is_bound_method) - (int)is_class; 9729dba64beSDimitry Andric 9739dba64beSDimitry Andric #endif 9749dba64beSDimitry Andric 9750b57cec5SDimitry Andric return result; 9760b57cec5SDimitry Andric } 9770b57cec5SDimitry Andric 9789dba64beSDimitry Andric constexpr unsigned 9799dba64beSDimitry Andric PythonCallable::ArgInfo::UNBOUNDED; // FIXME delete after c++17 9809dba64beSDimitry Andric 9810b57cec5SDimitry Andric PythonObject PythonCallable::operator()() { 9820b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, PyObject_CallObject(m_py_obj, nullptr)); 9830b57cec5SDimitry Andric } 9840b57cec5SDimitry Andric 9850b57cec5SDimitry Andric PythonObject PythonCallable:: 9860b57cec5SDimitry Andric operator()(std::initializer_list<PyObject *> args) { 9870b57cec5SDimitry Andric PythonTuple arg_tuple(args); 9880b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, 9890b57cec5SDimitry Andric PyObject_CallObject(m_py_obj, arg_tuple.get())); 9900b57cec5SDimitry Andric } 9910b57cec5SDimitry Andric 9920b57cec5SDimitry Andric PythonObject PythonCallable:: 9930b57cec5SDimitry Andric operator()(std::initializer_list<PythonObject> args) { 9940b57cec5SDimitry Andric PythonTuple arg_tuple(args); 9950b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, 9960b57cec5SDimitry Andric PyObject_CallObject(m_py_obj, arg_tuple.get())); 9970b57cec5SDimitry Andric } 9980b57cec5SDimitry Andric 9990b57cec5SDimitry Andric bool PythonFile::Check(PyObject *py_obj) { 10009dba64beSDimitry Andric if (!py_obj) 10019dba64beSDimitry Andric return false; 10020b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 10030b57cec5SDimitry Andric return PyFile_Check(py_obj); 10040b57cec5SDimitry Andric #else 10050b57cec5SDimitry Andric // In Python 3, there is no `PyFile_Check`, and in fact PyFile is not even a 10060b57cec5SDimitry Andric // first-class object type anymore. `PyFile_FromFd` is just a thin wrapper 10070b57cec5SDimitry Andric // over `io.open()`, which returns some object derived from `io.IOBase`. As a 10080b57cec5SDimitry Andric // result, the only way to detect a file in Python 3 is to check whether it 10099dba64beSDimitry Andric // inherits from `io.IOBase`. 10109dba64beSDimitry Andric auto io_module = PythonModule::Import("io"); 10119dba64beSDimitry Andric if (!io_module) { 10129dba64beSDimitry Andric llvm::consumeError(io_module.takeError()); 10130b57cec5SDimitry Andric return false; 10149dba64beSDimitry Andric } 10159dba64beSDimitry Andric auto iobase = io_module.get().Get("IOBase"); 10169dba64beSDimitry Andric if (!iobase) { 10179dba64beSDimitry Andric llvm::consumeError(iobase.takeError()); 10180b57cec5SDimitry Andric return false; 10199dba64beSDimitry Andric } 10209dba64beSDimitry Andric int r = PyObject_IsInstance(py_obj, iobase.get().get()); 10219dba64beSDimitry Andric if (r < 0) { 10229dba64beSDimitry Andric llvm::consumeError(exception()); // clear the exception and log it. 10239dba64beSDimitry Andric return false; 10249dba64beSDimitry Andric } 10259dba64beSDimitry Andric return !!r; 10260b57cec5SDimitry Andric #endif 10270b57cec5SDimitry Andric } 10280b57cec5SDimitry Andric 10299dba64beSDimitry Andric const char *PythonException::toCString() const { 10309dba64beSDimitry Andric if (!m_repr_bytes) 10319dba64beSDimitry Andric return "unknown exception"; 10329dba64beSDimitry Andric return PyBytes_AS_STRING(m_repr_bytes); 10330b57cec5SDimitry Andric } 10340b57cec5SDimitry Andric 10359dba64beSDimitry Andric PythonException::PythonException(const char *caller) { 10369dba64beSDimitry Andric assert(PyErr_Occurred()); 10379dba64beSDimitry Andric m_exception_type = m_exception = m_traceback = m_repr_bytes = NULL; 10389dba64beSDimitry Andric PyErr_Fetch(&m_exception_type, &m_exception, &m_traceback); 10399dba64beSDimitry Andric PyErr_NormalizeException(&m_exception_type, &m_exception, &m_traceback); 10409dba64beSDimitry Andric PyErr_Clear(); 10419dba64beSDimitry Andric if (m_exception) { 10429dba64beSDimitry Andric PyObject *repr = PyObject_Repr(m_exception); 10439dba64beSDimitry Andric if (repr) { 10449dba64beSDimitry Andric m_repr_bytes = PyUnicode_AsEncodedString(repr, "utf-8", nullptr); 10459dba64beSDimitry Andric if (!m_repr_bytes) { 10469dba64beSDimitry Andric PyErr_Clear(); 10479dba64beSDimitry Andric } 10489dba64beSDimitry Andric Py_XDECREF(repr); 10499dba64beSDimitry Andric } else { 10509dba64beSDimitry Andric PyErr_Clear(); 10519dba64beSDimitry Andric } 10529dba64beSDimitry Andric } 10539dba64beSDimitry Andric Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SCRIPT); 10549dba64beSDimitry Andric if (caller) 10559dba64beSDimitry Andric LLDB_LOGF(log, "%s failed with exception: %s", caller, toCString()); 10569dba64beSDimitry Andric else 10579dba64beSDimitry Andric LLDB_LOGF(log, "python exception: %s", toCString()); 10589dba64beSDimitry Andric } 10599dba64beSDimitry Andric void PythonException::Restore() { 10609dba64beSDimitry Andric if (m_exception_type && m_exception) { 10619dba64beSDimitry Andric PyErr_Restore(m_exception_type, m_exception, m_traceback); 10629dba64beSDimitry Andric } else { 10639dba64beSDimitry Andric PyErr_SetString(PyExc_Exception, toCString()); 10649dba64beSDimitry Andric } 10659dba64beSDimitry Andric m_exception_type = m_exception = m_traceback = NULL; 10660b57cec5SDimitry Andric } 10670b57cec5SDimitry Andric 10689dba64beSDimitry Andric PythonException::~PythonException() { 10699dba64beSDimitry Andric Py_XDECREF(m_exception_type); 10709dba64beSDimitry Andric Py_XDECREF(m_exception); 10719dba64beSDimitry Andric Py_XDECREF(m_traceback); 10729dba64beSDimitry Andric Py_XDECREF(m_repr_bytes); 10730b57cec5SDimitry Andric } 10740b57cec5SDimitry Andric 10759dba64beSDimitry Andric void PythonException::log(llvm::raw_ostream &OS) const { OS << toCString(); } 10769dba64beSDimitry Andric 10779dba64beSDimitry Andric std::error_code PythonException::convertToErrorCode() const { 10789dba64beSDimitry Andric return llvm::inconvertibleErrorCode(); 10799dba64beSDimitry Andric } 10809dba64beSDimitry Andric 10819dba64beSDimitry Andric bool PythonException::Matches(PyObject *exc) const { 10829dba64beSDimitry Andric return PyErr_GivenExceptionMatches(m_exception_type, exc); 10839dba64beSDimitry Andric } 10849dba64beSDimitry Andric 10859dba64beSDimitry Andric const char read_exception_script[] = R"( 10869dba64beSDimitry Andric import sys 10879dba64beSDimitry Andric from traceback import print_exception 10889dba64beSDimitry Andric if sys.version_info.major < 3: 10899dba64beSDimitry Andric from StringIO import StringIO 10909dba64beSDimitry Andric else: 10919dba64beSDimitry Andric from io import StringIO 10929dba64beSDimitry Andric def main(exc_type, exc_value, tb): 10939dba64beSDimitry Andric f = StringIO() 10949dba64beSDimitry Andric print_exception(exc_type, exc_value, tb, file=f) 10959dba64beSDimitry Andric return f.getvalue() 10969dba64beSDimitry Andric )"; 10979dba64beSDimitry Andric 10989dba64beSDimitry Andric std::string PythonException::ReadBacktrace() const { 10999dba64beSDimitry Andric 11009dba64beSDimitry Andric if (!m_traceback) 11019dba64beSDimitry Andric return toCString(); 11029dba64beSDimitry Andric 11039dba64beSDimitry Andric // no need to synchronize access to this global, we already have the GIL 11049dba64beSDimitry Andric static PythonScript read_exception(read_exception_script); 11059dba64beSDimitry Andric 11069dba64beSDimitry Andric Expected<std::string> backtrace = As<std::string>( 11079dba64beSDimitry Andric read_exception(m_exception_type, m_exception, m_traceback)); 11089dba64beSDimitry Andric 11099dba64beSDimitry Andric if (!backtrace) { 11109dba64beSDimitry Andric std::string message = 11119dba64beSDimitry Andric std::string(toCString()) + "\n" + 11125ffd83dbSDimitry Andric "Traceback unavailable, an error occurred while reading it:\n"; 11139dba64beSDimitry Andric return (message + llvm::toString(backtrace.takeError())); 11149dba64beSDimitry Andric } 11159dba64beSDimitry Andric 11169dba64beSDimitry Andric return std::move(backtrace.get()); 11179dba64beSDimitry Andric } 11189dba64beSDimitry Andric 11199dba64beSDimitry Andric char PythonException::ID = 0; 11209dba64beSDimitry Andric 11219dba64beSDimitry Andric llvm::Expected<File::OpenOptions> 11229dba64beSDimitry Andric GetOptionsForPyObject(const PythonObject &obj) { 11230b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 11249dba64beSDimitry Andric auto options = File::OpenOptions(0); 11259dba64beSDimitry Andric auto readable = As<bool>(obj.CallMethod("readable")); 11269dba64beSDimitry Andric if (!readable) 11279dba64beSDimitry Andric return readable.takeError(); 11289dba64beSDimitry Andric auto writable = As<bool>(obj.CallMethod("writable")); 11299dba64beSDimitry Andric if (!writable) 11309dba64beSDimitry Andric return writable.takeError(); 1131349cc55cSDimitry Andric if (readable.get() && writable.get()) 1132349cc55cSDimitry Andric options |= File::eOpenOptionReadWrite; 1133349cc55cSDimitry Andric else if (writable.get()) 1134349cc55cSDimitry Andric options |= File::eOpenOptionWriteOnly; 1135349cc55cSDimitry Andric else if (readable.get()) 1136349cc55cSDimitry Andric options |= File::eOpenOptionReadOnly; 11379dba64beSDimitry Andric return options; 11389dba64beSDimitry Andric #else 11399dba64beSDimitry Andric PythonString py_mode = obj.GetAttributeValue("mode").AsType<PythonString>(); 11409dba64beSDimitry Andric return File::GetOptionsFromMode(py_mode.GetString()); 11419dba64beSDimitry Andric #endif 11429dba64beSDimitry Andric } 11439dba64beSDimitry Andric 11449dba64beSDimitry Andric // Base class template for python files. All it knows how to do 11459dba64beSDimitry Andric // is hold a reference to the python object and close or flush it 11469dba64beSDimitry Andric // when the File is closed. 11479dba64beSDimitry Andric namespace { 11489dba64beSDimitry Andric template <typename Base> class OwnedPythonFile : public Base { 11499dba64beSDimitry Andric public: 11509dba64beSDimitry Andric template <typename... Args> 11519dba64beSDimitry Andric OwnedPythonFile(const PythonFile &file, bool borrowed, Args... args) 11529dba64beSDimitry Andric : Base(args...), m_py_obj(file), m_borrowed(borrowed) { 11539dba64beSDimitry Andric assert(m_py_obj); 11549dba64beSDimitry Andric } 11559dba64beSDimitry Andric 11569dba64beSDimitry Andric ~OwnedPythonFile() override { 11579dba64beSDimitry Andric assert(m_py_obj); 11589dba64beSDimitry Andric GIL takeGIL; 11599dba64beSDimitry Andric Close(); 11609dba64beSDimitry Andric // we need to ensure the python object is released while we still 11619dba64beSDimitry Andric // hold the GIL 11629dba64beSDimitry Andric m_py_obj.Reset(); 11639dba64beSDimitry Andric } 11649dba64beSDimitry Andric 11659dba64beSDimitry Andric bool IsPythonSideValid() const { 11669dba64beSDimitry Andric GIL takeGIL; 11679dba64beSDimitry Andric auto closed = As<bool>(m_py_obj.GetAttribute("closed")); 11689dba64beSDimitry Andric if (!closed) { 11699dba64beSDimitry Andric llvm::consumeError(closed.takeError()); 11709dba64beSDimitry Andric return false; 11719dba64beSDimitry Andric } 11729dba64beSDimitry Andric return !closed.get(); 11739dba64beSDimitry Andric } 11749dba64beSDimitry Andric 11759dba64beSDimitry Andric bool IsValid() const override { 11769dba64beSDimitry Andric return IsPythonSideValid() && Base::IsValid(); 11779dba64beSDimitry Andric } 11789dba64beSDimitry Andric 11799dba64beSDimitry Andric Status Close() override { 11809dba64beSDimitry Andric assert(m_py_obj); 11819dba64beSDimitry Andric Status py_error, base_error; 11829dba64beSDimitry Andric GIL takeGIL; 11839dba64beSDimitry Andric if (!m_borrowed) { 11849dba64beSDimitry Andric auto r = m_py_obj.CallMethod("close"); 11859dba64beSDimitry Andric if (!r) 11869dba64beSDimitry Andric py_error = Status(r.takeError()); 11879dba64beSDimitry Andric } 11889dba64beSDimitry Andric base_error = Base::Close(); 11899dba64beSDimitry Andric if (py_error.Fail()) 11909dba64beSDimitry Andric return py_error; 11919dba64beSDimitry Andric return base_error; 11929dba64beSDimitry Andric }; 11939dba64beSDimitry Andric 11949dba64beSDimitry Andric PyObject *GetPythonObject() const { 11959dba64beSDimitry Andric assert(m_py_obj.IsValid()); 11969dba64beSDimitry Andric return m_py_obj.get(); 11979dba64beSDimitry Andric } 11989dba64beSDimitry Andric 11999dba64beSDimitry Andric static bool classof(const File *file) = delete; 12009dba64beSDimitry Andric 12019dba64beSDimitry Andric protected: 12029dba64beSDimitry Andric PythonFile m_py_obj; 12039dba64beSDimitry Andric bool m_borrowed; 12049dba64beSDimitry Andric }; 12059dba64beSDimitry Andric } // namespace 12069dba64beSDimitry Andric 12079dba64beSDimitry Andric // A SimplePythonFile is a OwnedPythonFile that just does all I/O as 12089dba64beSDimitry Andric // a NativeFile 12099dba64beSDimitry Andric namespace { 12109dba64beSDimitry Andric class SimplePythonFile : public OwnedPythonFile<NativeFile> { 12119dba64beSDimitry Andric public: 12129dba64beSDimitry Andric SimplePythonFile(const PythonFile &file, bool borrowed, int fd, 12139dba64beSDimitry Andric File::OpenOptions options) 12149dba64beSDimitry Andric : OwnedPythonFile(file, borrowed, fd, options, false) {} 12159dba64beSDimitry Andric 12169dba64beSDimitry Andric static char ID; 12179dba64beSDimitry Andric bool isA(const void *classID) const override { 12189dba64beSDimitry Andric return classID == &ID || NativeFile::isA(classID); 12199dba64beSDimitry Andric } 12209dba64beSDimitry Andric static bool classof(const File *file) { return file->isA(&ID); } 12219dba64beSDimitry Andric }; 12229dba64beSDimitry Andric char SimplePythonFile::ID = 0; 12239dba64beSDimitry Andric } // namespace 12249dba64beSDimitry Andric 12259dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 12269dba64beSDimitry Andric 12279dba64beSDimitry Andric namespace { 12289dba64beSDimitry Andric class PythonBuffer { 12299dba64beSDimitry Andric public: 12309dba64beSDimitry Andric PythonBuffer &operator=(const PythonBuffer &) = delete; 12319dba64beSDimitry Andric PythonBuffer(const PythonBuffer &) = delete; 12329dba64beSDimitry Andric 12339dba64beSDimitry Andric static Expected<PythonBuffer> Create(PythonObject &obj, 12349dba64beSDimitry Andric int flags = PyBUF_SIMPLE) { 12359dba64beSDimitry Andric Py_buffer py_buffer = {}; 12369dba64beSDimitry Andric PyObject_GetBuffer(obj.get(), &py_buffer, flags); 12379dba64beSDimitry Andric if (!py_buffer.obj) 12389dba64beSDimitry Andric return llvm::make_error<PythonException>(); 12399dba64beSDimitry Andric return PythonBuffer(py_buffer); 12409dba64beSDimitry Andric } 12419dba64beSDimitry Andric 12429dba64beSDimitry Andric PythonBuffer(PythonBuffer &&other) { 12439dba64beSDimitry Andric m_buffer = other.m_buffer; 12449dba64beSDimitry Andric other.m_buffer.obj = nullptr; 12459dba64beSDimitry Andric } 12469dba64beSDimitry Andric 12479dba64beSDimitry Andric ~PythonBuffer() { 12489dba64beSDimitry Andric if (m_buffer.obj) 12499dba64beSDimitry Andric PyBuffer_Release(&m_buffer); 12509dba64beSDimitry Andric } 12519dba64beSDimitry Andric 12529dba64beSDimitry Andric Py_buffer &get() { return m_buffer; } 12539dba64beSDimitry Andric 12549dba64beSDimitry Andric private: 12559dba64beSDimitry Andric // takes ownership of the buffer. 12569dba64beSDimitry Andric PythonBuffer(const Py_buffer &py_buffer) : m_buffer(py_buffer) {} 12579dba64beSDimitry Andric Py_buffer m_buffer; 12589dba64beSDimitry Andric }; 12599dba64beSDimitry Andric } // namespace 12609dba64beSDimitry Andric 12619dba64beSDimitry Andric // Shared methods between TextPythonFile and BinaryPythonFile 12629dba64beSDimitry Andric namespace { 12639dba64beSDimitry Andric class PythonIOFile : public OwnedPythonFile<File> { 12649dba64beSDimitry Andric public: 12659dba64beSDimitry Andric PythonIOFile(const PythonFile &file, bool borrowed) 12669dba64beSDimitry Andric : OwnedPythonFile(file, borrowed) {} 12679dba64beSDimitry Andric 12689dba64beSDimitry Andric ~PythonIOFile() override { Close(); } 12699dba64beSDimitry Andric 12709dba64beSDimitry Andric bool IsValid() const override { return IsPythonSideValid(); } 12719dba64beSDimitry Andric 12729dba64beSDimitry Andric Status Close() override { 12739dba64beSDimitry Andric assert(m_py_obj); 12749dba64beSDimitry Andric GIL takeGIL; 12759dba64beSDimitry Andric if (m_borrowed) 12769dba64beSDimitry Andric return Flush(); 12779dba64beSDimitry Andric auto r = m_py_obj.CallMethod("close"); 12789dba64beSDimitry Andric if (!r) 12799dba64beSDimitry Andric return Status(r.takeError()); 12809dba64beSDimitry Andric return Status(); 12819dba64beSDimitry Andric } 12829dba64beSDimitry Andric 12839dba64beSDimitry Andric Status Flush() override { 12849dba64beSDimitry Andric GIL takeGIL; 12859dba64beSDimitry Andric auto r = m_py_obj.CallMethod("flush"); 12869dba64beSDimitry Andric if (!r) 12879dba64beSDimitry Andric return Status(r.takeError()); 12889dba64beSDimitry Andric return Status(); 12899dba64beSDimitry Andric } 12909dba64beSDimitry Andric 12919dba64beSDimitry Andric Expected<File::OpenOptions> GetOptions() const override { 12929dba64beSDimitry Andric GIL takeGIL; 12939dba64beSDimitry Andric return GetOptionsForPyObject(m_py_obj); 12949dba64beSDimitry Andric } 12959dba64beSDimitry Andric 12969dba64beSDimitry Andric static char ID; 12979dba64beSDimitry Andric bool isA(const void *classID) const override { 12989dba64beSDimitry Andric return classID == &ID || File::isA(classID); 12999dba64beSDimitry Andric } 13009dba64beSDimitry Andric static bool classof(const File *file) { return file->isA(&ID); } 13019dba64beSDimitry Andric }; 13029dba64beSDimitry Andric char PythonIOFile::ID = 0; 13039dba64beSDimitry Andric } // namespace 13049dba64beSDimitry Andric 13059dba64beSDimitry Andric namespace { 13069dba64beSDimitry Andric class BinaryPythonFile : public PythonIOFile { 13079dba64beSDimitry Andric protected: 13089dba64beSDimitry Andric int m_descriptor; 13099dba64beSDimitry Andric 13109dba64beSDimitry Andric public: 13119dba64beSDimitry Andric BinaryPythonFile(int fd, const PythonFile &file, bool borrowed) 13129dba64beSDimitry Andric : PythonIOFile(file, borrowed), 13139dba64beSDimitry Andric m_descriptor(File::DescriptorIsValid(fd) ? fd 13149dba64beSDimitry Andric : File::kInvalidDescriptor) {} 13159dba64beSDimitry Andric 13169dba64beSDimitry Andric int GetDescriptor() const override { return m_descriptor; } 13179dba64beSDimitry Andric 13189dba64beSDimitry Andric Status Write(const void *buf, size_t &num_bytes) override { 13199dba64beSDimitry Andric GIL takeGIL; 13209dba64beSDimitry Andric PyObject *pybuffer_p = PyMemoryView_FromMemory( 13219dba64beSDimitry Andric const_cast<char *>((const char *)buf), num_bytes, PyBUF_READ); 13229dba64beSDimitry Andric if (!pybuffer_p) 13239dba64beSDimitry Andric return Status(llvm::make_error<PythonException>()); 13249dba64beSDimitry Andric auto pybuffer = Take<PythonObject>(pybuffer_p); 13259dba64beSDimitry Andric num_bytes = 0; 13269dba64beSDimitry Andric auto bytes_written = As<long long>(m_py_obj.CallMethod("write", pybuffer)); 13279dba64beSDimitry Andric if (!bytes_written) 13289dba64beSDimitry Andric return Status(bytes_written.takeError()); 13299dba64beSDimitry Andric if (bytes_written.get() < 0) 13309dba64beSDimitry Andric return Status(".write() method returned a negative number!"); 13319dba64beSDimitry Andric static_assert(sizeof(long long) >= sizeof(size_t), "overflow"); 13329dba64beSDimitry Andric num_bytes = bytes_written.get(); 13339dba64beSDimitry Andric return Status(); 13349dba64beSDimitry Andric } 13359dba64beSDimitry Andric 13369dba64beSDimitry Andric Status Read(void *buf, size_t &num_bytes) override { 13379dba64beSDimitry Andric GIL takeGIL; 13389dba64beSDimitry Andric static_assert(sizeof(long long) >= sizeof(size_t), "overflow"); 13399dba64beSDimitry Andric auto pybuffer_obj = 13409dba64beSDimitry Andric m_py_obj.CallMethod("read", (unsigned long long)num_bytes); 13419dba64beSDimitry Andric if (!pybuffer_obj) 13429dba64beSDimitry Andric return Status(pybuffer_obj.takeError()); 13439dba64beSDimitry Andric num_bytes = 0; 13449dba64beSDimitry Andric if (pybuffer_obj.get().IsNone()) { 13459dba64beSDimitry Andric // EOF 13469dba64beSDimitry Andric num_bytes = 0; 13479dba64beSDimitry Andric return Status(); 13489dba64beSDimitry Andric } 13499dba64beSDimitry Andric auto pybuffer = PythonBuffer::Create(pybuffer_obj.get()); 13509dba64beSDimitry Andric if (!pybuffer) 13519dba64beSDimitry Andric return Status(pybuffer.takeError()); 13529dba64beSDimitry Andric memcpy(buf, pybuffer.get().get().buf, pybuffer.get().get().len); 13539dba64beSDimitry Andric num_bytes = pybuffer.get().get().len; 13549dba64beSDimitry Andric return Status(); 13559dba64beSDimitry Andric } 13569dba64beSDimitry Andric }; 13579dba64beSDimitry Andric } // namespace 13589dba64beSDimitry Andric 13599dba64beSDimitry Andric namespace { 13609dba64beSDimitry Andric class TextPythonFile : public PythonIOFile { 13619dba64beSDimitry Andric protected: 13629dba64beSDimitry Andric int m_descriptor; 13639dba64beSDimitry Andric 13649dba64beSDimitry Andric public: 13659dba64beSDimitry Andric TextPythonFile(int fd, const PythonFile &file, bool borrowed) 13669dba64beSDimitry Andric : PythonIOFile(file, borrowed), 13679dba64beSDimitry Andric m_descriptor(File::DescriptorIsValid(fd) ? fd 13689dba64beSDimitry Andric : File::kInvalidDescriptor) {} 13699dba64beSDimitry Andric 13709dba64beSDimitry Andric int GetDescriptor() const override { return m_descriptor; } 13719dba64beSDimitry Andric 13729dba64beSDimitry Andric Status Write(const void *buf, size_t &num_bytes) override { 13739dba64beSDimitry Andric GIL takeGIL; 13749dba64beSDimitry Andric auto pystring = 13759dba64beSDimitry Andric PythonString::FromUTF8(llvm::StringRef((const char *)buf, num_bytes)); 13769dba64beSDimitry Andric if (!pystring) 13779dba64beSDimitry Andric return Status(pystring.takeError()); 13789dba64beSDimitry Andric num_bytes = 0; 13799dba64beSDimitry Andric auto bytes_written = 13809dba64beSDimitry Andric As<long long>(m_py_obj.CallMethod("write", pystring.get())); 13819dba64beSDimitry Andric if (!bytes_written) 13829dba64beSDimitry Andric return Status(bytes_written.takeError()); 13839dba64beSDimitry Andric if (bytes_written.get() < 0) 13849dba64beSDimitry Andric return Status(".write() method returned a negative number!"); 13859dba64beSDimitry Andric static_assert(sizeof(long long) >= sizeof(size_t), "overflow"); 13869dba64beSDimitry Andric num_bytes = bytes_written.get(); 13879dba64beSDimitry Andric return Status(); 13889dba64beSDimitry Andric } 13899dba64beSDimitry Andric 13909dba64beSDimitry Andric Status Read(void *buf, size_t &num_bytes) override { 13919dba64beSDimitry Andric GIL takeGIL; 13929dba64beSDimitry Andric size_t num_chars = num_bytes / 6; 13939dba64beSDimitry Andric size_t orig_num_bytes = num_bytes; 13949dba64beSDimitry Andric num_bytes = 0; 13959dba64beSDimitry Andric if (orig_num_bytes < 6) { 13969dba64beSDimitry Andric return Status("can't read less than 6 bytes from a utf8 text stream"); 13979dba64beSDimitry Andric } 13989dba64beSDimitry Andric auto pystring = As<PythonString>( 13999dba64beSDimitry Andric m_py_obj.CallMethod("read", (unsigned long long)num_chars)); 14009dba64beSDimitry Andric if (!pystring) 14019dba64beSDimitry Andric return Status(pystring.takeError()); 14029dba64beSDimitry Andric if (pystring.get().IsNone()) { 14039dba64beSDimitry Andric // EOF 14049dba64beSDimitry Andric return Status(); 14059dba64beSDimitry Andric } 14069dba64beSDimitry Andric auto stringref = pystring.get().AsUTF8(); 14079dba64beSDimitry Andric if (!stringref) 14089dba64beSDimitry Andric return Status(stringref.takeError()); 14099dba64beSDimitry Andric num_bytes = stringref.get().size(); 14109dba64beSDimitry Andric memcpy(buf, stringref.get().begin(), num_bytes); 14119dba64beSDimitry Andric return Status(); 14129dba64beSDimitry Andric } 14139dba64beSDimitry Andric }; 14149dba64beSDimitry Andric } // namespace 14159dba64beSDimitry Andric 14169dba64beSDimitry Andric #endif 14179dba64beSDimitry Andric 14189dba64beSDimitry Andric llvm::Expected<FileSP> PythonFile::ConvertToFile(bool borrowed) { 14199dba64beSDimitry Andric if (!IsValid()) 14209dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14219dba64beSDimitry Andric "invalid PythonFile"); 14229dba64beSDimitry Andric 14239dba64beSDimitry Andric int fd = PyObject_AsFileDescriptor(m_py_obj); 14249dba64beSDimitry Andric if (fd < 0) { 14259dba64beSDimitry Andric PyErr_Clear(); 14269dba64beSDimitry Andric return ConvertToFileForcingUseOfScriptingIOMethods(borrowed); 14279dba64beSDimitry Andric } 14289dba64beSDimitry Andric auto options = GetOptionsForPyObject(*this); 14299dba64beSDimitry Andric if (!options) 14309dba64beSDimitry Andric return options.takeError(); 14319dba64beSDimitry Andric 1432349cc55cSDimitry Andric File::OpenOptions rw = 1433349cc55cSDimitry Andric options.get() & (File::eOpenOptionReadOnly | File::eOpenOptionWriteOnly | 1434349cc55cSDimitry Andric File::eOpenOptionReadWrite); 1435349cc55cSDimitry Andric if (rw == File::eOpenOptionWriteOnly || rw == File::eOpenOptionReadWrite) { 14369dba64beSDimitry Andric // LLDB and python will not share I/O buffers. We should probably 14379dba64beSDimitry Andric // flush the python buffers now. 14389dba64beSDimitry Andric auto r = CallMethod("flush"); 14399dba64beSDimitry Andric if (!r) 14409dba64beSDimitry Andric return r.takeError(); 1441480093f4SDimitry Andric } 14429dba64beSDimitry Andric 14439dba64beSDimitry Andric FileSP file_sp; 14449dba64beSDimitry Andric if (borrowed) { 14459dba64beSDimitry Andric // In this case we we don't need to retain the python 14469dba64beSDimitry Andric // object at all. 14479dba64beSDimitry Andric file_sp = std::make_shared<NativeFile>(fd, options.get(), false); 14489dba64beSDimitry Andric } else { 14499dba64beSDimitry Andric file_sp = std::static_pointer_cast<File>( 14509dba64beSDimitry Andric std::make_shared<SimplePythonFile>(*this, borrowed, fd, options.get())); 14519dba64beSDimitry Andric } 14529dba64beSDimitry Andric if (!file_sp->IsValid()) 14539dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14549dba64beSDimitry Andric "invalid File"); 14559dba64beSDimitry Andric 14569dba64beSDimitry Andric return file_sp; 14579dba64beSDimitry Andric } 14589dba64beSDimitry Andric 14599dba64beSDimitry Andric llvm::Expected<FileSP> 14609dba64beSDimitry Andric PythonFile::ConvertToFileForcingUseOfScriptingIOMethods(bool borrowed) { 14619dba64beSDimitry Andric 14629dba64beSDimitry Andric assert(!PyErr_Occurred()); 14639dba64beSDimitry Andric 14649dba64beSDimitry Andric if (!IsValid()) 14659dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14669dba64beSDimitry Andric "invalid PythonFile"); 14679dba64beSDimitry Andric 14689dba64beSDimitry Andric #if PY_MAJOR_VERSION < 3 14699dba64beSDimitry Andric 14709dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14719dba64beSDimitry Andric "not supported on python 2"); 14729dba64beSDimitry Andric 14739dba64beSDimitry Andric #else 14749dba64beSDimitry Andric 14759dba64beSDimitry Andric int fd = PyObject_AsFileDescriptor(m_py_obj); 14769dba64beSDimitry Andric if (fd < 0) { 14779dba64beSDimitry Andric PyErr_Clear(); 14789dba64beSDimitry Andric fd = File::kInvalidDescriptor; 14799dba64beSDimitry Andric } 14809dba64beSDimitry Andric 14819dba64beSDimitry Andric auto io_module = PythonModule::Import("io"); 14829dba64beSDimitry Andric if (!io_module) 14839dba64beSDimitry Andric return io_module.takeError(); 14849dba64beSDimitry Andric auto textIOBase = io_module.get().Get("TextIOBase"); 14859dba64beSDimitry Andric if (!textIOBase) 14869dba64beSDimitry Andric return textIOBase.takeError(); 14879dba64beSDimitry Andric auto rawIOBase = io_module.get().Get("RawIOBase"); 14889dba64beSDimitry Andric if (!rawIOBase) 14899dba64beSDimitry Andric return rawIOBase.takeError(); 14909dba64beSDimitry Andric auto bufferedIOBase = io_module.get().Get("BufferedIOBase"); 14919dba64beSDimitry Andric if (!bufferedIOBase) 14929dba64beSDimitry Andric return bufferedIOBase.takeError(); 14939dba64beSDimitry Andric 14949dba64beSDimitry Andric FileSP file_sp; 14959dba64beSDimitry Andric 14969dba64beSDimitry Andric auto isTextIO = IsInstance(textIOBase.get()); 14979dba64beSDimitry Andric if (!isTextIO) 14989dba64beSDimitry Andric return isTextIO.takeError(); 14999dba64beSDimitry Andric if (isTextIO.get()) 15009dba64beSDimitry Andric file_sp = std::static_pointer_cast<File>( 15019dba64beSDimitry Andric std::make_shared<TextPythonFile>(fd, *this, borrowed)); 15029dba64beSDimitry Andric 15039dba64beSDimitry Andric auto isRawIO = IsInstance(rawIOBase.get()); 15049dba64beSDimitry Andric if (!isRawIO) 15059dba64beSDimitry Andric return isRawIO.takeError(); 15069dba64beSDimitry Andric auto isBufferedIO = IsInstance(bufferedIOBase.get()); 15079dba64beSDimitry Andric if (!isBufferedIO) 15089dba64beSDimitry Andric return isBufferedIO.takeError(); 15099dba64beSDimitry Andric 15109dba64beSDimitry Andric if (isRawIO.get() || isBufferedIO.get()) { 15119dba64beSDimitry Andric file_sp = std::static_pointer_cast<File>( 15129dba64beSDimitry Andric std::make_shared<BinaryPythonFile>(fd, *this, borrowed)); 15139dba64beSDimitry Andric } 15149dba64beSDimitry Andric 15159dba64beSDimitry Andric if (!file_sp) 15169dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 15179dba64beSDimitry Andric "python file is neither text nor binary"); 15189dba64beSDimitry Andric 15199dba64beSDimitry Andric if (!file_sp->IsValid()) 15209dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 15219dba64beSDimitry Andric "invalid File"); 15229dba64beSDimitry Andric 15239dba64beSDimitry Andric return file_sp; 15249dba64beSDimitry Andric 15259dba64beSDimitry Andric #endif 15269dba64beSDimitry Andric } 15279dba64beSDimitry Andric 15289dba64beSDimitry Andric Expected<PythonFile> PythonFile::FromFile(File &file, const char *mode) { 15299dba64beSDimitry Andric if (!file.IsValid()) 15309dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 15319dba64beSDimitry Andric "invalid file"); 15329dba64beSDimitry Andric 15339dba64beSDimitry Andric if (auto *simple = llvm::dyn_cast<SimplePythonFile>(&file)) 15349dba64beSDimitry Andric return Retain<PythonFile>(simple->GetPythonObject()); 15359dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 15369dba64beSDimitry Andric if (auto *pythonio = llvm::dyn_cast<PythonIOFile>(&file)) 15379dba64beSDimitry Andric return Retain<PythonFile>(pythonio->GetPythonObject()); 15389dba64beSDimitry Andric #endif 15399dba64beSDimitry Andric 15409dba64beSDimitry Andric if (!mode) { 15419dba64beSDimitry Andric auto m = file.GetOpenMode(); 15429dba64beSDimitry Andric if (!m) 15439dba64beSDimitry Andric return m.takeError(); 15449dba64beSDimitry Andric mode = m.get(); 15459dba64beSDimitry Andric } 15469dba64beSDimitry Andric 15479dba64beSDimitry Andric PyObject *file_obj; 15489dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 15499dba64beSDimitry Andric file_obj = PyFile_FromFd(file.GetDescriptor(), nullptr, mode, -1, nullptr, 1550480093f4SDimitry Andric "ignore", nullptr, /*closefd=*/0); 15510b57cec5SDimitry Andric #else 1552480093f4SDimitry Andric // I'd like to pass ::fflush here if the file is writable, so that 1553480093f4SDimitry Andric // when the python side destructs the file object it will be flushed. 1554480093f4SDimitry Andric // However, this would be dangerous. It can cause fflush to be called 1555480093f4SDimitry Andric // after fclose if the python program keeps a reference to the file after 1556480093f4SDimitry Andric // the original lldb_private::File has been destructed. 1557480093f4SDimitry Andric // 1558480093f4SDimitry Andric // It's all well and good to ask a python program not to use a closed file 1559480093f4SDimitry Andric // but asking a python program to make sure objects get released in a 1560480093f4SDimitry Andric // particular order is not safe. 1561480093f4SDimitry Andric // 1562480093f4SDimitry Andric // The tradeoff here is that if a python 2 program wants to make sure this 1563480093f4SDimitry Andric // file gets flushed, they'll have to do it explicitly or wait untill the 1564480093f4SDimitry Andric // original lldb File itself gets flushed. 1565480093f4SDimitry Andric file_obj = PyFile_FromFile(file.GetStream(), py2_const_cast(""), 1566480093f4SDimitry Andric py2_const_cast(mode), [](FILE *) { return 0; }); 15670b57cec5SDimitry Andric #endif 15689dba64beSDimitry Andric 15699dba64beSDimitry Andric if (!file_obj) 15709dba64beSDimitry Andric return exception(); 15719dba64beSDimitry Andric 15729dba64beSDimitry Andric return Take<PythonFile>(file_obj); 15730b57cec5SDimitry Andric } 15740b57cec5SDimitry Andric 15759dba64beSDimitry Andric Error PythonScript::Init() { 15769dba64beSDimitry Andric if (function.IsValid()) 15779dba64beSDimitry Andric return Error::success(); 15780b57cec5SDimitry Andric 15799dba64beSDimitry Andric PythonDictionary globals(PyInitialValue::Empty); 15809dba64beSDimitry Andric auto builtins = PythonModule::BuiltinsModule(); 15819dba64beSDimitry Andric if (Error error = globals.SetItem("__builtins__", builtins)) 15829dba64beSDimitry Andric return error; 15839dba64beSDimitry Andric PyObject *o = 15849dba64beSDimitry Andric PyRun_String(script, Py_file_input, globals.get(), globals.get()); 15859dba64beSDimitry Andric if (!o) 15869dba64beSDimitry Andric return exception(); 15879dba64beSDimitry Andric Take<PythonObject>(o); 15889dba64beSDimitry Andric auto f = As<PythonCallable>(globals.GetItem("main")); 15899dba64beSDimitry Andric if (!f) 15909dba64beSDimitry Andric return f.takeError(); 15919dba64beSDimitry Andric function = std::move(f.get()); 15929dba64beSDimitry Andric 15939dba64beSDimitry Andric return Error::success(); 15940b57cec5SDimitry Andric } 15950b57cec5SDimitry Andric 15969dba64beSDimitry Andric llvm::Expected<PythonObject> 15979dba64beSDimitry Andric python::runStringOneLine(const llvm::Twine &string, 15989dba64beSDimitry Andric const PythonDictionary &globals, 15999dba64beSDimitry Andric const PythonDictionary &locals) { 16009dba64beSDimitry Andric if (!globals.IsValid() || !locals.IsValid()) 16019dba64beSDimitry Andric return nullDeref(); 16020b57cec5SDimitry Andric 16039dba64beSDimitry Andric PyObject *code = 16049dba64beSDimitry Andric Py_CompileString(NullTerminated(string), "<string>", Py_eval_input); 16059dba64beSDimitry Andric if (!code) { 16069dba64beSDimitry Andric PyErr_Clear(); 16079dba64beSDimitry Andric code = 16089dba64beSDimitry Andric Py_CompileString(NullTerminated(string), "<string>", Py_single_input); 16099dba64beSDimitry Andric } 16109dba64beSDimitry Andric if (!code) 16119dba64beSDimitry Andric return exception(); 16129dba64beSDimitry Andric auto code_ref = Take<PythonObject>(code); 16139dba64beSDimitry Andric 16149dba64beSDimitry Andric #if PY_MAJOR_VERSION < 3 16159dba64beSDimitry Andric PyObject *result = 16169dba64beSDimitry Andric PyEval_EvalCode((PyCodeObject *)code, globals.get(), locals.get()); 16179dba64beSDimitry Andric #else 16189dba64beSDimitry Andric PyObject *result = PyEval_EvalCode(code, globals.get(), locals.get()); 16199dba64beSDimitry Andric #endif 16209dba64beSDimitry Andric 16219dba64beSDimitry Andric if (!result) 16229dba64beSDimitry Andric return exception(); 16239dba64beSDimitry Andric 16249dba64beSDimitry Andric return Take<PythonObject>(result); 16259dba64beSDimitry Andric } 16269dba64beSDimitry Andric 16279dba64beSDimitry Andric llvm::Expected<PythonObject> 16289dba64beSDimitry Andric python::runStringMultiLine(const llvm::Twine &string, 16299dba64beSDimitry Andric const PythonDictionary &globals, 16309dba64beSDimitry Andric const PythonDictionary &locals) { 16319dba64beSDimitry Andric if (!globals.IsValid() || !locals.IsValid()) 16329dba64beSDimitry Andric return nullDeref(); 16339dba64beSDimitry Andric PyObject *result = PyRun_String(NullTerminated(string), Py_file_input, 16349dba64beSDimitry Andric globals.get(), locals.get()); 16359dba64beSDimitry Andric if (!result) 16369dba64beSDimitry Andric return exception(); 16379dba64beSDimitry Andric return Take<PythonObject>(result); 16380b57cec5SDimitry Andric } 16390b57cec5SDimitry Andric 16400b57cec5SDimitry Andric #endif 1641