xref: /freebsd-src/contrib/llvm-project/lldb/source/Plugins/ScriptInterpreter/Python/PythonDataObjects.cpp (revision 5ffd83dbcc34f10e07f6d3e968ae6365869615f4)
1*5ffd83dbSDimitry Andric //===-- PythonDataObjects.cpp ---------------------------------------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
9480093f4SDimitry Andric #include "lldb/Host/Config.h"
100b57cec5SDimitry Andric 
11480093f4SDimitry Andric #if LLDB_ENABLE_PYTHON
120b57cec5SDimitry Andric 
130b57cec5SDimitry Andric #include "PythonDataObjects.h"
140b57cec5SDimitry Andric #include "ScriptInterpreterPython.h"
150b57cec5SDimitry Andric 
160b57cec5SDimitry Andric #include "lldb/Host/File.h"
170b57cec5SDimitry Andric #include "lldb/Host/FileSystem.h"
180b57cec5SDimitry Andric #include "lldb/Interpreter/ScriptInterpreter.h"
199dba64beSDimitry Andric #include "lldb/Utility/Log.h"
200b57cec5SDimitry Andric #include "lldb/Utility/Stream.h"
210b57cec5SDimitry Andric 
220b57cec5SDimitry Andric #include "llvm/ADT/StringSwitch.h"
239dba64beSDimitry Andric #include "llvm/Support/Casting.h"
240b57cec5SDimitry Andric #include "llvm/Support/ConvertUTF.h"
250b57cec5SDimitry Andric #include "llvm/Support/Errno.h"
260b57cec5SDimitry Andric 
270b57cec5SDimitry Andric #include <stdio.h>
280b57cec5SDimitry Andric 
290b57cec5SDimitry Andric using namespace lldb_private;
300b57cec5SDimitry Andric using namespace lldb;
319dba64beSDimitry Andric using namespace lldb_private::python;
329dba64beSDimitry Andric using llvm::cantFail;
339dba64beSDimitry Andric using llvm::Error;
349dba64beSDimitry Andric using llvm::Expected;
359dba64beSDimitry Andric using llvm::Twine;
360b57cec5SDimitry Andric 
379dba64beSDimitry Andric template <> Expected<bool> python::As<bool>(Expected<PythonObject> &&obj) {
389dba64beSDimitry Andric   if (!obj)
399dba64beSDimitry Andric     return obj.takeError();
409dba64beSDimitry Andric   return obj.get().IsTrue();
419dba64beSDimitry Andric }
429dba64beSDimitry Andric 
439dba64beSDimitry Andric template <>
449dba64beSDimitry Andric Expected<long long> python::As<long long>(Expected<PythonObject> &&obj) {
459dba64beSDimitry Andric   if (!obj)
469dba64beSDimitry Andric     return obj.takeError();
47*5ffd83dbSDimitry Andric   return obj->AsLongLong();
48*5ffd83dbSDimitry Andric }
49*5ffd83dbSDimitry Andric 
50*5ffd83dbSDimitry Andric template <>
51*5ffd83dbSDimitry Andric Expected<unsigned long long>
52*5ffd83dbSDimitry Andric python::As<unsigned long long>(Expected<PythonObject> &&obj) {
53*5ffd83dbSDimitry Andric   if (!obj)
54*5ffd83dbSDimitry Andric     return obj.takeError();
55*5ffd83dbSDimitry Andric   return obj->AsUnsignedLongLong();
569dba64beSDimitry Andric }
579dba64beSDimitry Andric 
589dba64beSDimitry Andric template <>
599dba64beSDimitry Andric Expected<std::string> python::As<std::string>(Expected<PythonObject> &&obj) {
609dba64beSDimitry Andric   if (!obj)
619dba64beSDimitry Andric     return obj.takeError();
629dba64beSDimitry Andric   PyObject *str_obj = PyObject_Str(obj.get().get());
639dba64beSDimitry Andric   if (!obj)
649dba64beSDimitry Andric     return llvm::make_error<PythonException>();
659dba64beSDimitry Andric   auto str = Take<PythonString>(str_obj);
669dba64beSDimitry Andric   auto utf8 = str.AsUTF8();
679dba64beSDimitry Andric   if (!utf8)
689dba64beSDimitry Andric     return utf8.takeError();
69*5ffd83dbSDimitry Andric   return std::string(utf8.get());
70*5ffd83dbSDimitry Andric }
71*5ffd83dbSDimitry Andric 
72*5ffd83dbSDimitry Andric Expected<long long> PythonObject::AsLongLong() const {
73*5ffd83dbSDimitry Andric   if (!m_py_obj)
74*5ffd83dbSDimitry Andric     return nullDeref();
75*5ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3
76*5ffd83dbSDimitry Andric   if (!PyLong_Check(m_py_obj)) {
77*5ffd83dbSDimitry Andric     PythonInteger i(PyRefType::Borrowed, m_py_obj);
78*5ffd83dbSDimitry Andric     return i.AsLongLong();
79*5ffd83dbSDimitry Andric   }
80*5ffd83dbSDimitry Andric #endif
81*5ffd83dbSDimitry Andric   assert(!PyErr_Occurred());
82*5ffd83dbSDimitry Andric   long long r = PyLong_AsLongLong(m_py_obj);
83*5ffd83dbSDimitry Andric   if (PyErr_Occurred())
84*5ffd83dbSDimitry Andric     return exception();
85*5ffd83dbSDimitry Andric   return r;
86*5ffd83dbSDimitry Andric }
87*5ffd83dbSDimitry Andric 
88*5ffd83dbSDimitry Andric Expected<long long> PythonObject::AsUnsignedLongLong() const {
89*5ffd83dbSDimitry Andric   if (!m_py_obj)
90*5ffd83dbSDimitry Andric     return nullDeref();
91*5ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3
92*5ffd83dbSDimitry Andric   if (!PyLong_Check(m_py_obj)) {
93*5ffd83dbSDimitry Andric     PythonInteger i(PyRefType::Borrowed, m_py_obj);
94*5ffd83dbSDimitry Andric     return i.AsUnsignedLongLong();
95*5ffd83dbSDimitry Andric   }
96*5ffd83dbSDimitry Andric #endif
97*5ffd83dbSDimitry Andric   assert(!PyErr_Occurred());
98*5ffd83dbSDimitry Andric   long long r = PyLong_AsUnsignedLongLong(m_py_obj);
99*5ffd83dbSDimitry Andric   if (PyErr_Occurred())
100*5ffd83dbSDimitry Andric     return exception();
101*5ffd83dbSDimitry Andric   return r;
102*5ffd83dbSDimitry Andric }
103*5ffd83dbSDimitry Andric 
104*5ffd83dbSDimitry Andric // wraps on overflow, instead of raising an error.
105*5ffd83dbSDimitry Andric Expected<unsigned long long> PythonObject::AsModuloUnsignedLongLong() const {
106*5ffd83dbSDimitry Andric   if (!m_py_obj)
107*5ffd83dbSDimitry Andric     return nullDeref();
108*5ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3
109*5ffd83dbSDimitry Andric   if (!PyLong_Check(m_py_obj)) {
110*5ffd83dbSDimitry Andric     PythonInteger i(PyRefType::Borrowed, m_py_obj);
111*5ffd83dbSDimitry Andric     return i.AsModuloUnsignedLongLong();
112*5ffd83dbSDimitry Andric   }
113*5ffd83dbSDimitry Andric #endif
114*5ffd83dbSDimitry Andric   assert(!PyErr_Occurred());
115*5ffd83dbSDimitry Andric   unsigned long long r = PyLong_AsUnsignedLongLongMask(m_py_obj);
116*5ffd83dbSDimitry Andric   if (PyErr_Occurred())
117*5ffd83dbSDimitry Andric     return exception();
118*5ffd83dbSDimitry Andric   return r;
1199dba64beSDimitry Andric }
1209dba64beSDimitry Andric 
1219dba64beSDimitry Andric void StructuredPythonObject::Serialize(llvm::json::OStream &s) const {
1229dba64beSDimitry Andric   s.value(llvm::formatv("Python Obj: {0:X}", GetValue()).str());
1230b57cec5SDimitry Andric }
1240b57cec5SDimitry Andric 
1250b57cec5SDimitry Andric // PythonObject
1260b57cec5SDimitry Andric 
1270b57cec5SDimitry Andric void PythonObject::Dump(Stream &strm) const {
1280b57cec5SDimitry Andric   if (m_py_obj) {
1290b57cec5SDimitry Andric     FILE *file = llvm::sys::RetryAfterSignal(nullptr, ::tmpfile);
1300b57cec5SDimitry Andric     if (file) {
1310b57cec5SDimitry Andric       ::PyObject_Print(m_py_obj, file, 0);
1320b57cec5SDimitry Andric       const long length = ftell(file);
1330b57cec5SDimitry Andric       if (length) {
1340b57cec5SDimitry Andric         ::rewind(file);
1350b57cec5SDimitry Andric         std::vector<char> file_contents(length, '\0');
1360b57cec5SDimitry Andric         const size_t length_read =
1370b57cec5SDimitry Andric             ::fread(file_contents.data(), 1, file_contents.size(), file);
1380b57cec5SDimitry Andric         if (length_read > 0)
1390b57cec5SDimitry Andric           strm.Write(file_contents.data(), length_read);
1400b57cec5SDimitry Andric       }
1410b57cec5SDimitry Andric       ::fclose(file);
1420b57cec5SDimitry Andric     }
1430b57cec5SDimitry Andric   } else
1440b57cec5SDimitry Andric     strm.PutCString("NULL");
1450b57cec5SDimitry Andric }
1460b57cec5SDimitry Andric 
1470b57cec5SDimitry Andric PyObjectType PythonObject::GetObjectType() const {
1480b57cec5SDimitry Andric   if (!IsAllocated())
1490b57cec5SDimitry Andric     return PyObjectType::None;
1500b57cec5SDimitry Andric 
1510b57cec5SDimitry Andric   if (PythonModule::Check(m_py_obj))
1520b57cec5SDimitry Andric     return PyObjectType::Module;
1530b57cec5SDimitry Andric   if (PythonList::Check(m_py_obj))
1540b57cec5SDimitry Andric     return PyObjectType::List;
1550b57cec5SDimitry Andric   if (PythonTuple::Check(m_py_obj))
1560b57cec5SDimitry Andric     return PyObjectType::Tuple;
1570b57cec5SDimitry Andric   if (PythonDictionary::Check(m_py_obj))
1580b57cec5SDimitry Andric     return PyObjectType::Dictionary;
1590b57cec5SDimitry Andric   if (PythonString::Check(m_py_obj))
1600b57cec5SDimitry Andric     return PyObjectType::String;
1610b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3
1620b57cec5SDimitry Andric   if (PythonBytes::Check(m_py_obj))
1630b57cec5SDimitry Andric     return PyObjectType::Bytes;
1640b57cec5SDimitry Andric #endif
1650b57cec5SDimitry Andric   if (PythonByteArray::Check(m_py_obj))
1660b57cec5SDimitry Andric     return PyObjectType::ByteArray;
1670b57cec5SDimitry Andric   if (PythonBoolean::Check(m_py_obj))
1680b57cec5SDimitry Andric     return PyObjectType::Boolean;
1690b57cec5SDimitry Andric   if (PythonInteger::Check(m_py_obj))
1700b57cec5SDimitry Andric     return PyObjectType::Integer;
1710b57cec5SDimitry Andric   if (PythonFile::Check(m_py_obj))
1720b57cec5SDimitry Andric     return PyObjectType::File;
1730b57cec5SDimitry Andric   if (PythonCallable::Check(m_py_obj))
1740b57cec5SDimitry Andric     return PyObjectType::Callable;
1750b57cec5SDimitry Andric   return PyObjectType::Unknown;
1760b57cec5SDimitry Andric }
1770b57cec5SDimitry Andric 
1780b57cec5SDimitry Andric PythonString PythonObject::Repr() const {
1790b57cec5SDimitry Andric   if (!m_py_obj)
1800b57cec5SDimitry Andric     return PythonString();
1810b57cec5SDimitry Andric   PyObject *repr = PyObject_Repr(m_py_obj);
1820b57cec5SDimitry Andric   if (!repr)
1830b57cec5SDimitry Andric     return PythonString();
1840b57cec5SDimitry Andric   return PythonString(PyRefType::Owned, repr);
1850b57cec5SDimitry Andric }
1860b57cec5SDimitry Andric 
1870b57cec5SDimitry Andric PythonString PythonObject::Str() const {
1880b57cec5SDimitry Andric   if (!m_py_obj)
1890b57cec5SDimitry Andric     return PythonString();
1900b57cec5SDimitry Andric   PyObject *str = PyObject_Str(m_py_obj);
1910b57cec5SDimitry Andric   if (!str)
1920b57cec5SDimitry Andric     return PythonString();
1930b57cec5SDimitry Andric   return PythonString(PyRefType::Owned, str);
1940b57cec5SDimitry Andric }
1950b57cec5SDimitry Andric 
1960b57cec5SDimitry Andric PythonObject
1970b57cec5SDimitry Andric PythonObject::ResolveNameWithDictionary(llvm::StringRef name,
1980b57cec5SDimitry Andric                                         const PythonDictionary &dict) {
1990b57cec5SDimitry Andric   size_t dot_pos = name.find('.');
2000b57cec5SDimitry Andric   llvm::StringRef piece = name.substr(0, dot_pos);
2010b57cec5SDimitry Andric   PythonObject result = dict.GetItemForKey(PythonString(piece));
2020b57cec5SDimitry Andric   if (dot_pos == llvm::StringRef::npos) {
2030b57cec5SDimitry Andric     // There was no dot, we're done.
2040b57cec5SDimitry Andric     return result;
2050b57cec5SDimitry Andric   }
2060b57cec5SDimitry Andric 
2070b57cec5SDimitry Andric   // There was a dot.  The remaining portion of the name should be looked up in
2080b57cec5SDimitry Andric   // the context of the object that was found in the dictionary.
2090b57cec5SDimitry Andric   return result.ResolveName(name.substr(dot_pos + 1));
2100b57cec5SDimitry Andric }
2110b57cec5SDimitry Andric 
2120b57cec5SDimitry Andric PythonObject PythonObject::ResolveName(llvm::StringRef name) const {
2130b57cec5SDimitry Andric   // Resolve the name in the context of the specified object.  If, for example,
2140b57cec5SDimitry Andric   // `this` refers to a PyModule, then this will look for `name` in this
2150b57cec5SDimitry Andric   // module.  If `this` refers to a PyType, then it will resolve `name` as an
2160b57cec5SDimitry Andric   // attribute of that type.  If `this` refers to an instance of an object,
2170b57cec5SDimitry Andric   // then it will resolve `name` as the value of the specified field.
2180b57cec5SDimitry Andric   //
2190b57cec5SDimitry Andric   // This function handles dotted names so that, for example, if `m_py_obj`
2200b57cec5SDimitry Andric   // refers to the `sys` module, and `name` == "path.append", then it will find
2210b57cec5SDimitry Andric   // the function `sys.path.append`.
2220b57cec5SDimitry Andric 
2230b57cec5SDimitry Andric   size_t dot_pos = name.find('.');
2240b57cec5SDimitry Andric   if (dot_pos == llvm::StringRef::npos) {
2250b57cec5SDimitry Andric     // No dots in the name, we should be able to find the value immediately as
2260b57cec5SDimitry Andric     // an attribute of `m_py_obj`.
2270b57cec5SDimitry Andric     return GetAttributeValue(name);
2280b57cec5SDimitry Andric   }
2290b57cec5SDimitry Andric 
2300b57cec5SDimitry Andric   // Look up the first piece of the name, and resolve the rest as a child of
2310b57cec5SDimitry Andric   // that.
2320b57cec5SDimitry Andric   PythonObject parent = ResolveName(name.substr(0, dot_pos));
2330b57cec5SDimitry Andric   if (!parent.IsAllocated())
2340b57cec5SDimitry Andric     return PythonObject();
2350b57cec5SDimitry Andric 
2360b57cec5SDimitry Andric   // Tail recursion.. should be optimized by the compiler
2370b57cec5SDimitry Andric   return parent.ResolveName(name.substr(dot_pos + 1));
2380b57cec5SDimitry Andric }
2390b57cec5SDimitry Andric 
2400b57cec5SDimitry Andric bool PythonObject::HasAttribute(llvm::StringRef attr) const {
2410b57cec5SDimitry Andric   if (!IsValid())
2420b57cec5SDimitry Andric     return false;
2430b57cec5SDimitry Andric   PythonString py_attr(attr);
2440b57cec5SDimitry Andric   return !!PyObject_HasAttr(m_py_obj, py_attr.get());
2450b57cec5SDimitry Andric }
2460b57cec5SDimitry Andric 
2470b57cec5SDimitry Andric PythonObject PythonObject::GetAttributeValue(llvm::StringRef attr) const {
2480b57cec5SDimitry Andric   if (!IsValid())
2490b57cec5SDimitry Andric     return PythonObject();
2500b57cec5SDimitry Andric 
2510b57cec5SDimitry Andric   PythonString py_attr(attr);
2520b57cec5SDimitry Andric   if (!PyObject_HasAttr(m_py_obj, py_attr.get()))
2530b57cec5SDimitry Andric     return PythonObject();
2540b57cec5SDimitry Andric 
2550b57cec5SDimitry Andric   return PythonObject(PyRefType::Owned,
2560b57cec5SDimitry Andric                       PyObject_GetAttr(m_py_obj, py_attr.get()));
2570b57cec5SDimitry Andric }
2580b57cec5SDimitry Andric 
2590b57cec5SDimitry Andric StructuredData::ObjectSP PythonObject::CreateStructuredObject() const {
2600b57cec5SDimitry Andric   switch (GetObjectType()) {
2610b57cec5SDimitry Andric   case PyObjectType::Dictionary:
2620b57cec5SDimitry Andric     return PythonDictionary(PyRefType::Borrowed, m_py_obj)
2630b57cec5SDimitry Andric         .CreateStructuredDictionary();
2640b57cec5SDimitry Andric   case PyObjectType::Boolean:
2650b57cec5SDimitry Andric     return PythonBoolean(PyRefType::Borrowed, m_py_obj)
2660b57cec5SDimitry Andric         .CreateStructuredBoolean();
2670b57cec5SDimitry Andric   case PyObjectType::Integer:
2680b57cec5SDimitry Andric     return PythonInteger(PyRefType::Borrowed, m_py_obj)
2690b57cec5SDimitry Andric         .CreateStructuredInteger();
2700b57cec5SDimitry Andric   case PyObjectType::List:
2710b57cec5SDimitry Andric     return PythonList(PyRefType::Borrowed, m_py_obj).CreateStructuredArray();
2720b57cec5SDimitry Andric   case PyObjectType::String:
2730b57cec5SDimitry Andric     return PythonString(PyRefType::Borrowed, m_py_obj).CreateStructuredString();
2740b57cec5SDimitry Andric   case PyObjectType::Bytes:
2750b57cec5SDimitry Andric     return PythonBytes(PyRefType::Borrowed, m_py_obj).CreateStructuredString();
2760b57cec5SDimitry Andric   case PyObjectType::ByteArray:
2770b57cec5SDimitry Andric     return PythonByteArray(PyRefType::Borrowed, m_py_obj)
2780b57cec5SDimitry Andric         .CreateStructuredString();
2790b57cec5SDimitry Andric   case PyObjectType::None:
2800b57cec5SDimitry Andric     return StructuredData::ObjectSP();
2810b57cec5SDimitry Andric   default:
2820b57cec5SDimitry Andric     return StructuredData::ObjectSP(new StructuredPythonObject(m_py_obj));
2830b57cec5SDimitry Andric   }
2840b57cec5SDimitry Andric }
2850b57cec5SDimitry Andric 
// PythonBytes
2870b57cec5SDimitry Andric 
2889dba64beSDimitry Andric PythonBytes::PythonBytes(llvm::ArrayRef<uint8_t> bytes) { SetBytes(bytes); }
2890b57cec5SDimitry Andric 
2909dba64beSDimitry Andric PythonBytes::PythonBytes(const uint8_t *bytes, size_t length) {
2910b57cec5SDimitry Andric   SetBytes(llvm::ArrayRef<uint8_t>(bytes, length));
2920b57cec5SDimitry Andric }
2930b57cec5SDimitry Andric 
2940b57cec5SDimitry Andric bool PythonBytes::Check(PyObject *py_obj) {
2950b57cec5SDimitry Andric   if (!py_obj)
2960b57cec5SDimitry Andric     return false;
2970b57cec5SDimitry Andric   return PyBytes_Check(py_obj);
2980b57cec5SDimitry Andric }
2990b57cec5SDimitry Andric 
3000b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> PythonBytes::GetBytes() const {
3010b57cec5SDimitry Andric   if (!IsValid())
3020b57cec5SDimitry Andric     return llvm::ArrayRef<uint8_t>();
3030b57cec5SDimitry Andric 
3040b57cec5SDimitry Andric   Py_ssize_t size;
3050b57cec5SDimitry Andric   char *c;
3060b57cec5SDimitry Andric 
3070b57cec5SDimitry Andric   PyBytes_AsStringAndSize(m_py_obj, &c, &size);
3080b57cec5SDimitry Andric   return llvm::ArrayRef<uint8_t>(reinterpret_cast<uint8_t *>(c), size);
3090b57cec5SDimitry Andric }
3100b57cec5SDimitry Andric 
3110b57cec5SDimitry Andric size_t PythonBytes::GetSize() const {
3120b57cec5SDimitry Andric   if (!IsValid())
3130b57cec5SDimitry Andric     return 0;
3140b57cec5SDimitry Andric   return PyBytes_Size(m_py_obj);
3150b57cec5SDimitry Andric }
3160b57cec5SDimitry Andric 
3170b57cec5SDimitry Andric void PythonBytes::SetBytes(llvm::ArrayRef<uint8_t> bytes) {
3180b57cec5SDimitry Andric   const char *data = reinterpret_cast<const char *>(bytes.data());
3199dba64beSDimitry Andric   *this = Take<PythonBytes>(PyBytes_FromStringAndSize(data, bytes.size()));
3200b57cec5SDimitry Andric }
3210b57cec5SDimitry Andric 
3220b57cec5SDimitry Andric StructuredData::StringSP PythonBytes::CreateStructuredString() const {
3230b57cec5SDimitry Andric   StructuredData::StringSP result(new StructuredData::String);
3240b57cec5SDimitry Andric   Py_ssize_t size;
3250b57cec5SDimitry Andric   char *c;
3260b57cec5SDimitry Andric   PyBytes_AsStringAndSize(m_py_obj, &c, &size);
3270b57cec5SDimitry Andric   result->SetValue(std::string(c, size));
3280b57cec5SDimitry Andric   return result;
3290b57cec5SDimitry Andric }
3300b57cec5SDimitry Andric 
3310b57cec5SDimitry Andric PythonByteArray::PythonByteArray(llvm::ArrayRef<uint8_t> bytes)
3320b57cec5SDimitry Andric     : PythonByteArray(bytes.data(), bytes.size()) {}
3330b57cec5SDimitry Andric 
3340b57cec5SDimitry Andric PythonByteArray::PythonByteArray(const uint8_t *bytes, size_t length) {
3350b57cec5SDimitry Andric   const char *str = reinterpret_cast<const char *>(bytes);
3369dba64beSDimitry Andric   *this = Take<PythonByteArray>(PyByteArray_FromStringAndSize(str, length));
3370b57cec5SDimitry Andric }
3380b57cec5SDimitry Andric 
3390b57cec5SDimitry Andric bool PythonByteArray::Check(PyObject *py_obj) {
3400b57cec5SDimitry Andric   if (!py_obj)
3410b57cec5SDimitry Andric     return false;
3420b57cec5SDimitry Andric   return PyByteArray_Check(py_obj);
3430b57cec5SDimitry Andric }
3440b57cec5SDimitry Andric 
3450b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> PythonByteArray::GetBytes() const {
3460b57cec5SDimitry Andric   if (!IsValid())
3470b57cec5SDimitry Andric     return llvm::ArrayRef<uint8_t>();
3480b57cec5SDimitry Andric 
3490b57cec5SDimitry Andric   char *c = PyByteArray_AsString(m_py_obj);
3500b57cec5SDimitry Andric   size_t size = GetSize();
3510b57cec5SDimitry Andric   return llvm::ArrayRef<uint8_t>(reinterpret_cast<uint8_t *>(c), size);
3520b57cec5SDimitry Andric }
3530b57cec5SDimitry Andric 
3540b57cec5SDimitry Andric size_t PythonByteArray::GetSize() const {
3550b57cec5SDimitry Andric   if (!IsValid())
3560b57cec5SDimitry Andric     return 0;
3570b57cec5SDimitry Andric 
3580b57cec5SDimitry Andric   return PyByteArray_Size(m_py_obj);
3590b57cec5SDimitry Andric }
3600b57cec5SDimitry Andric 
3610b57cec5SDimitry Andric StructuredData::StringSP PythonByteArray::CreateStructuredString() const {
3620b57cec5SDimitry Andric   StructuredData::StringSP result(new StructuredData::String);
3630b57cec5SDimitry Andric   llvm::ArrayRef<uint8_t> bytes = GetBytes();
3640b57cec5SDimitry Andric   const char *str = reinterpret_cast<const char *>(bytes.data());
3650b57cec5SDimitry Andric   result->SetValue(std::string(str, bytes.size()));
3660b57cec5SDimitry Andric   return result;
3670b57cec5SDimitry Andric }
3680b57cec5SDimitry Andric 
3690b57cec5SDimitry Andric // PythonString
3700b57cec5SDimitry Andric 
3719dba64beSDimitry Andric Expected<PythonString> PythonString::FromUTF8(llvm::StringRef string) {
3729dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3
3739dba64beSDimitry Andric   PyObject *str = PyUnicode_FromStringAndSize(string.data(), string.size());
3749dba64beSDimitry Andric #else
3759dba64beSDimitry Andric   PyObject *str = PyString_FromStringAndSize(string.data(), string.size());
3769dba64beSDimitry Andric #endif
3779dba64beSDimitry Andric   if (!str)
3789dba64beSDimitry Andric     return llvm::make_error<PythonException>();
3799dba64beSDimitry Andric   return Take<PythonString>(str);
3800b57cec5SDimitry Andric }
3810b57cec5SDimitry Andric 
3829dba64beSDimitry Andric PythonString::PythonString(llvm::StringRef string) { SetString(string); }
3830b57cec5SDimitry Andric 
3840b57cec5SDimitry Andric bool PythonString::Check(PyObject *py_obj) {
3850b57cec5SDimitry Andric   if (!py_obj)
3860b57cec5SDimitry Andric     return false;
3870b57cec5SDimitry Andric 
3880b57cec5SDimitry Andric   if (PyUnicode_Check(py_obj))
3890b57cec5SDimitry Andric     return true;
3900b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3
3910b57cec5SDimitry Andric   if (PyString_Check(py_obj))
3920b57cec5SDimitry Andric     return true;
3930b57cec5SDimitry Andric #endif
3940b57cec5SDimitry Andric   return false;
3950b57cec5SDimitry Andric }
3960b57cec5SDimitry Andric 
3979dba64beSDimitry Andric void PythonString::Convert(PyRefType &type, PyObject *&py_obj) {
3980b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3
3990b57cec5SDimitry Andric   // In Python 2, Don't store PyUnicode objects directly, because we need
4000b57cec5SDimitry Andric   // access to their underlying character buffers which Python 2 doesn't
4010b57cec5SDimitry Andric   // provide.
4029dba64beSDimitry Andric   if (PyUnicode_Check(py_obj)) {
4039dba64beSDimitry Andric     PyObject *s = PyUnicode_AsUTF8String(py_obj);
4049dba64beSDimitry Andric     if (s == nullptr) {
4059dba64beSDimitry Andric       PyErr_Clear();
4069dba64beSDimitry Andric       if (type == PyRefType::Owned)
4079dba64beSDimitry Andric         Py_DECREF(py_obj);
4089dba64beSDimitry Andric       return;
4099dba64beSDimitry Andric     }
4109dba64beSDimitry Andric     if (type == PyRefType::Owned)
4119dba64beSDimitry Andric       Py_DECREF(py_obj);
4129dba64beSDimitry Andric     else
4139dba64beSDimitry Andric       type = PyRefType::Owned;
4149dba64beSDimitry Andric     py_obj = s;
4159dba64beSDimitry Andric   }
4160b57cec5SDimitry Andric #endif
4170b57cec5SDimitry Andric }
4180b57cec5SDimitry Andric 
4190b57cec5SDimitry Andric llvm::StringRef PythonString::GetString() const {
4209dba64beSDimitry Andric   auto s = AsUTF8();
4219dba64beSDimitry Andric   if (!s) {
4229dba64beSDimitry Andric     llvm::consumeError(s.takeError());
4239dba64beSDimitry Andric     return llvm::StringRef("");
4249dba64beSDimitry Andric   }
4259dba64beSDimitry Andric   return s.get();
4269dba64beSDimitry Andric }
4279dba64beSDimitry Andric 
4289dba64beSDimitry Andric Expected<llvm::StringRef> PythonString::AsUTF8() const {
4290b57cec5SDimitry Andric   if (!IsValid())
4309dba64beSDimitry Andric     return nullDeref();
4310b57cec5SDimitry Andric 
4320b57cec5SDimitry Andric   Py_ssize_t size;
4330b57cec5SDimitry Andric   const char *data;
4340b57cec5SDimitry Andric 
4350b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3
4360b57cec5SDimitry Andric   data = PyUnicode_AsUTF8AndSize(m_py_obj, &size);
4370b57cec5SDimitry Andric #else
4389dba64beSDimitry Andric   char *c = NULL;
4399dba64beSDimitry Andric   int r = PyString_AsStringAndSize(m_py_obj, &c, &size);
4409dba64beSDimitry Andric   if (r < 0)
4419dba64beSDimitry Andric     c = NULL;
4420b57cec5SDimitry Andric   data = c;
4430b57cec5SDimitry Andric #endif
4449dba64beSDimitry Andric 
4459dba64beSDimitry Andric   if (!data)
4469dba64beSDimitry Andric     return exception();
4479dba64beSDimitry Andric 
4480b57cec5SDimitry Andric   return llvm::StringRef(data, size);
4490b57cec5SDimitry Andric }
4500b57cec5SDimitry Andric 
4510b57cec5SDimitry Andric size_t PythonString::GetSize() const {
4520b57cec5SDimitry Andric   if (IsValid()) {
4530b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3
4540b57cec5SDimitry Andric     return PyUnicode_GetSize(m_py_obj);
4550b57cec5SDimitry Andric #else
4560b57cec5SDimitry Andric     return PyString_Size(m_py_obj);
4570b57cec5SDimitry Andric #endif
4580b57cec5SDimitry Andric   }
4590b57cec5SDimitry Andric   return 0;
4600b57cec5SDimitry Andric }
4610b57cec5SDimitry Andric 
4620b57cec5SDimitry Andric void PythonString::SetString(llvm::StringRef string) {
4639dba64beSDimitry Andric   auto s = FromUTF8(string);
4649dba64beSDimitry Andric   if (!s) {
4659dba64beSDimitry Andric     llvm::consumeError(s.takeError());
4669dba64beSDimitry Andric     Reset();
4679dba64beSDimitry Andric   } else {
4689dba64beSDimitry Andric     *this = std::move(s.get());
4699dba64beSDimitry Andric   }
4700b57cec5SDimitry Andric }
4710b57cec5SDimitry Andric 
4720b57cec5SDimitry Andric StructuredData::StringSP PythonString::CreateStructuredString() const {
4730b57cec5SDimitry Andric   StructuredData::StringSP result(new StructuredData::String);
4740b57cec5SDimitry Andric   result->SetValue(GetString());
4750b57cec5SDimitry Andric   return result;
4760b57cec5SDimitry Andric }
4770b57cec5SDimitry Andric 
4780b57cec5SDimitry Andric // PythonInteger
4790b57cec5SDimitry Andric 
4809dba64beSDimitry Andric PythonInteger::PythonInteger(int64_t value) { SetInteger(value); }
4810b57cec5SDimitry Andric 
4820b57cec5SDimitry Andric bool PythonInteger::Check(PyObject *py_obj) {
4830b57cec5SDimitry Andric   if (!py_obj)
4840b57cec5SDimitry Andric     return false;
4850b57cec5SDimitry Andric 
4860b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3
4870b57cec5SDimitry Andric   // Python 3 does not have PyInt_Check.  There is only one type of integral
4880b57cec5SDimitry Andric   // value, long.
4890b57cec5SDimitry Andric   return PyLong_Check(py_obj);
4900b57cec5SDimitry Andric #else
4910b57cec5SDimitry Andric   return PyLong_Check(py_obj) || PyInt_Check(py_obj);
4920b57cec5SDimitry Andric #endif
4930b57cec5SDimitry Andric }
4940b57cec5SDimitry Andric 
4959dba64beSDimitry Andric void PythonInteger::Convert(PyRefType &type, PyObject *&py_obj) {
4960b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3
4970b57cec5SDimitry Andric   // Always store this as a PyLong, which makes interoperability between Python
4980b57cec5SDimitry Andric   // 2.x and Python 3.x easier.  This is only necessary in 2.x, since 3.x
4990b57cec5SDimitry Andric   // doesn't even have a PyInt.
5000b57cec5SDimitry Andric   if (PyInt_Check(py_obj)) {
5010b57cec5SDimitry Andric     // Since we converted the original object to a different type, the new
5020b57cec5SDimitry Andric     // object is an owned object regardless of the ownership semantics
5030b57cec5SDimitry Andric     // requested by the user.
5049dba64beSDimitry Andric     long long value = PyInt_AsLong(py_obj);
5059dba64beSDimitry Andric     PyObject *l = nullptr;
5069dba64beSDimitry Andric     if (!PyErr_Occurred())
5079dba64beSDimitry Andric       l = PyLong_FromLongLong(value);
5089dba64beSDimitry Andric     if (l == nullptr) {
5099dba64beSDimitry Andric       PyErr_Clear();
5109dba64beSDimitry Andric       if (type == PyRefType::Owned)
5119dba64beSDimitry Andric         Py_DECREF(py_obj);
5129dba64beSDimitry Andric       return;
5139dba64beSDimitry Andric     }
5149dba64beSDimitry Andric     if (type == PyRefType::Owned)
5159dba64beSDimitry Andric       Py_DECREF(py_obj);
5169dba64beSDimitry Andric     else
5179dba64beSDimitry Andric       type = PyRefType::Owned;
5189dba64beSDimitry Andric     py_obj = l;
5190b57cec5SDimitry Andric   }
5200b57cec5SDimitry Andric #endif
5210b57cec5SDimitry Andric }
5220b57cec5SDimitry Andric 
5230b57cec5SDimitry Andric void PythonInteger::SetInteger(int64_t value) {
5249dba64beSDimitry Andric   *this = Take<PythonInteger>(PyLong_FromLongLong(value));
5250b57cec5SDimitry Andric }
5260b57cec5SDimitry Andric 
5270b57cec5SDimitry Andric StructuredData::IntegerSP PythonInteger::CreateStructuredInteger() const {
5280b57cec5SDimitry Andric   StructuredData::IntegerSP result(new StructuredData::Integer);
529*5ffd83dbSDimitry Andric   // FIXME this is really not ideal.   Errors are silently converted to 0
530*5ffd83dbSDimitry Andric   // and overflows are silently wrapped.   But we'd need larger changes
531*5ffd83dbSDimitry Andric   // to StructuredData to fix it, so that's how it is for now.
532*5ffd83dbSDimitry Andric   llvm::Expected<unsigned long long> value = AsModuloUnsignedLongLong();
533*5ffd83dbSDimitry Andric   if (!value) {
534*5ffd83dbSDimitry Andric     llvm::consumeError(value.takeError());
535*5ffd83dbSDimitry Andric     result->SetValue(0);
536*5ffd83dbSDimitry Andric   } else {
537*5ffd83dbSDimitry Andric     result->SetValue(value.get());
538*5ffd83dbSDimitry Andric   }
5390b57cec5SDimitry Andric   return result;
5400b57cec5SDimitry Andric }
5410b57cec5SDimitry Andric 
5420b57cec5SDimitry Andric // PythonBoolean
5430b57cec5SDimitry Andric 
5440b57cec5SDimitry Andric PythonBoolean::PythonBoolean(bool value) {
5450b57cec5SDimitry Andric   SetValue(value);
5460b57cec5SDimitry Andric }
5470b57cec5SDimitry Andric 
5480b57cec5SDimitry Andric bool PythonBoolean::Check(PyObject *py_obj) {
5490b57cec5SDimitry Andric   return py_obj ? PyBool_Check(py_obj) : false;
5500b57cec5SDimitry Andric }
5510b57cec5SDimitry Andric 
5520b57cec5SDimitry Andric bool PythonBoolean::GetValue() const {
5530b57cec5SDimitry Andric   return m_py_obj ? PyObject_IsTrue(m_py_obj) : false;
5540b57cec5SDimitry Andric }
5550b57cec5SDimitry Andric 
5560b57cec5SDimitry Andric void PythonBoolean::SetValue(bool value) {
5579dba64beSDimitry Andric   *this = Take<PythonBoolean>(PyBool_FromLong(value));
5580b57cec5SDimitry Andric }
5590b57cec5SDimitry Andric 
5600b57cec5SDimitry Andric StructuredData::BooleanSP PythonBoolean::CreateStructuredBoolean() const {
5610b57cec5SDimitry Andric   StructuredData::BooleanSP result(new StructuredData::Boolean);
5620b57cec5SDimitry Andric   result->SetValue(GetValue());
5630b57cec5SDimitry Andric   return result;
5640b57cec5SDimitry Andric }
5650b57cec5SDimitry Andric 
5660b57cec5SDimitry Andric // PythonList
5670b57cec5SDimitry Andric 
5689dba64beSDimitry Andric PythonList::PythonList(PyInitialValue value) {
5690b57cec5SDimitry Andric   if (value == PyInitialValue::Empty)
5709dba64beSDimitry Andric     *this = Take<PythonList>(PyList_New(0));
5710b57cec5SDimitry Andric }
5720b57cec5SDimitry Andric 
5739dba64beSDimitry Andric PythonList::PythonList(int list_size) {
5749dba64beSDimitry Andric   *this = Take<PythonList>(PyList_New(list_size));
5750b57cec5SDimitry Andric }
5760b57cec5SDimitry Andric 
5770b57cec5SDimitry Andric bool PythonList::Check(PyObject *py_obj) {
5780b57cec5SDimitry Andric   if (!py_obj)
5790b57cec5SDimitry Andric     return false;
5800b57cec5SDimitry Andric   return PyList_Check(py_obj);
5810b57cec5SDimitry Andric }
5820b57cec5SDimitry Andric 
5830b57cec5SDimitry Andric uint32_t PythonList::GetSize() const {
5840b57cec5SDimitry Andric   if (IsValid())
5850b57cec5SDimitry Andric     return PyList_GET_SIZE(m_py_obj);
5860b57cec5SDimitry Andric   return 0;
5870b57cec5SDimitry Andric }
5880b57cec5SDimitry Andric 
5890b57cec5SDimitry Andric PythonObject PythonList::GetItemAtIndex(uint32_t index) const {
5900b57cec5SDimitry Andric   if (IsValid())
5910b57cec5SDimitry Andric     return PythonObject(PyRefType::Borrowed, PyList_GetItem(m_py_obj, index));
5920b57cec5SDimitry Andric   return PythonObject();
5930b57cec5SDimitry Andric }
5940b57cec5SDimitry Andric 
5950b57cec5SDimitry Andric void PythonList::SetItemAtIndex(uint32_t index, const PythonObject &object) {
5960b57cec5SDimitry Andric   if (IsAllocated() && object.IsValid()) {
5970b57cec5SDimitry Andric     // PyList_SetItem is documented to "steal" a reference, so we need to
5980b57cec5SDimitry Andric     // convert it to an owned reference by incrementing it.
5990b57cec5SDimitry Andric     Py_INCREF(object.get());
6000b57cec5SDimitry Andric     PyList_SetItem(m_py_obj, index, object.get());
6010b57cec5SDimitry Andric   }
6020b57cec5SDimitry Andric }
6030b57cec5SDimitry Andric 
6040b57cec5SDimitry Andric void PythonList::AppendItem(const PythonObject &object) {
6050b57cec5SDimitry Andric   if (IsAllocated() && object.IsValid()) {
6060b57cec5SDimitry Andric     // `PyList_Append` does *not* steal a reference, so do not call `Py_INCREF`
6070b57cec5SDimitry Andric     // here like we do with `PyList_SetItem`.
6080b57cec5SDimitry Andric     PyList_Append(m_py_obj, object.get());
6090b57cec5SDimitry Andric   }
6100b57cec5SDimitry Andric }
6110b57cec5SDimitry Andric 
6120b57cec5SDimitry Andric StructuredData::ArraySP PythonList::CreateStructuredArray() const {
6130b57cec5SDimitry Andric   StructuredData::ArraySP result(new StructuredData::Array);
6140b57cec5SDimitry Andric   uint32_t count = GetSize();
6150b57cec5SDimitry Andric   for (uint32_t i = 0; i < count; ++i) {
6160b57cec5SDimitry Andric     PythonObject obj = GetItemAtIndex(i);
6170b57cec5SDimitry Andric     result->AddItem(obj.CreateStructuredObject());
6180b57cec5SDimitry Andric   }
6190b57cec5SDimitry Andric   return result;
6200b57cec5SDimitry Andric }
6210b57cec5SDimitry Andric 
6220b57cec5SDimitry Andric // PythonTuple
6230b57cec5SDimitry Andric 
6249dba64beSDimitry Andric PythonTuple::PythonTuple(PyInitialValue value) {
6250b57cec5SDimitry Andric   if (value == PyInitialValue::Empty)
6269dba64beSDimitry Andric     *this = Take<PythonTuple>(PyTuple_New(0));
6270b57cec5SDimitry Andric }
6280b57cec5SDimitry Andric 
6299dba64beSDimitry Andric PythonTuple::PythonTuple(int tuple_size) {
6309dba64beSDimitry Andric   *this = Take<PythonTuple>(PyTuple_New(tuple_size));
6310b57cec5SDimitry Andric }
6320b57cec5SDimitry Andric 
6330b57cec5SDimitry Andric PythonTuple::PythonTuple(std::initializer_list<PythonObject> objects) {
6340b57cec5SDimitry Andric   m_py_obj = PyTuple_New(objects.size());
6350b57cec5SDimitry Andric 
6360b57cec5SDimitry Andric   uint32_t idx = 0;
6370b57cec5SDimitry Andric   for (auto object : objects) {
6380b57cec5SDimitry Andric     if (object.IsValid())
6390b57cec5SDimitry Andric       SetItemAtIndex(idx, object);
6400b57cec5SDimitry Andric     idx++;
6410b57cec5SDimitry Andric   }
6420b57cec5SDimitry Andric }
6430b57cec5SDimitry Andric 
6440b57cec5SDimitry Andric PythonTuple::PythonTuple(std::initializer_list<PyObject *> objects) {
6450b57cec5SDimitry Andric   m_py_obj = PyTuple_New(objects.size());
6460b57cec5SDimitry Andric 
6470b57cec5SDimitry Andric   uint32_t idx = 0;
6480b57cec5SDimitry Andric   for (auto py_object : objects) {
6490b57cec5SDimitry Andric     PythonObject object(PyRefType::Borrowed, py_object);
6500b57cec5SDimitry Andric     if (object.IsValid())
6510b57cec5SDimitry Andric       SetItemAtIndex(idx, object);
6520b57cec5SDimitry Andric     idx++;
6530b57cec5SDimitry Andric   }
6540b57cec5SDimitry Andric }
6550b57cec5SDimitry Andric 
6560b57cec5SDimitry Andric bool PythonTuple::Check(PyObject *py_obj) {
6570b57cec5SDimitry Andric   if (!py_obj)
6580b57cec5SDimitry Andric     return false;
6590b57cec5SDimitry Andric   return PyTuple_Check(py_obj);
6600b57cec5SDimitry Andric }
6610b57cec5SDimitry Andric 
6620b57cec5SDimitry Andric uint32_t PythonTuple::GetSize() const {
6630b57cec5SDimitry Andric   if (IsValid())
6640b57cec5SDimitry Andric     return PyTuple_GET_SIZE(m_py_obj);
6650b57cec5SDimitry Andric   return 0;
6660b57cec5SDimitry Andric }
6670b57cec5SDimitry Andric 
6680b57cec5SDimitry Andric PythonObject PythonTuple::GetItemAtIndex(uint32_t index) const {
6690b57cec5SDimitry Andric   if (IsValid())
6700b57cec5SDimitry Andric     return PythonObject(PyRefType::Borrowed, PyTuple_GetItem(m_py_obj, index));
6710b57cec5SDimitry Andric   return PythonObject();
6720b57cec5SDimitry Andric }
6730b57cec5SDimitry Andric 
6740b57cec5SDimitry Andric void PythonTuple::SetItemAtIndex(uint32_t index, const PythonObject &object) {
6750b57cec5SDimitry Andric   if (IsAllocated() && object.IsValid()) {
6760b57cec5SDimitry Andric     // PyTuple_SetItem is documented to "steal" a reference, so we need to
6770b57cec5SDimitry Andric     // convert it to an owned reference by incrementing it.
6780b57cec5SDimitry Andric     Py_INCREF(object.get());
6790b57cec5SDimitry Andric     PyTuple_SetItem(m_py_obj, index, object.get());
6800b57cec5SDimitry Andric   }
6810b57cec5SDimitry Andric }
6820b57cec5SDimitry Andric 
6830b57cec5SDimitry Andric StructuredData::ArraySP PythonTuple::CreateStructuredArray() const {
6840b57cec5SDimitry Andric   StructuredData::ArraySP result(new StructuredData::Array);
6850b57cec5SDimitry Andric   uint32_t count = GetSize();
6860b57cec5SDimitry Andric   for (uint32_t i = 0; i < count; ++i) {
6870b57cec5SDimitry Andric     PythonObject obj = GetItemAtIndex(i);
6880b57cec5SDimitry Andric     result->AddItem(obj.CreateStructuredObject());
6890b57cec5SDimitry Andric   }
6900b57cec5SDimitry Andric   return result;
6910b57cec5SDimitry Andric }
6920b57cec5SDimitry Andric 
6930b57cec5SDimitry Andric // PythonDictionary
6940b57cec5SDimitry Andric 
6959dba64beSDimitry Andric PythonDictionary::PythonDictionary(PyInitialValue value) {
6960b57cec5SDimitry Andric   if (value == PyInitialValue::Empty)
6979dba64beSDimitry Andric     *this = Take<PythonDictionary>(PyDict_New());
6980b57cec5SDimitry Andric }
6990b57cec5SDimitry Andric 
7000b57cec5SDimitry Andric bool PythonDictionary::Check(PyObject *py_obj) {
7010b57cec5SDimitry Andric   if (!py_obj)
7020b57cec5SDimitry Andric     return false;
7030b57cec5SDimitry Andric 
7040b57cec5SDimitry Andric   return PyDict_Check(py_obj);
7050b57cec5SDimitry Andric }
7060b57cec5SDimitry Andric 
7070b57cec5SDimitry Andric uint32_t PythonDictionary::GetSize() const {
7080b57cec5SDimitry Andric   if (IsValid())
7090b57cec5SDimitry Andric     return PyDict_Size(m_py_obj);
7100b57cec5SDimitry Andric   return 0;
7110b57cec5SDimitry Andric }
7120b57cec5SDimitry Andric 
7130b57cec5SDimitry Andric PythonList PythonDictionary::GetKeys() const {
7140b57cec5SDimitry Andric   if (IsValid())
7150b57cec5SDimitry Andric     return PythonList(PyRefType::Owned, PyDict_Keys(m_py_obj));
7160b57cec5SDimitry Andric   return PythonList(PyInitialValue::Invalid);
7170b57cec5SDimitry Andric }
7180b57cec5SDimitry Andric 
7190b57cec5SDimitry Andric PythonObject PythonDictionary::GetItemForKey(const PythonObject &key) const {
7209dba64beSDimitry Andric   auto item = GetItem(key);
7219dba64beSDimitry Andric   if (!item) {
7229dba64beSDimitry Andric     llvm::consumeError(item.takeError());
7230b57cec5SDimitry Andric     return PythonObject();
7240b57cec5SDimitry Andric   }
7259dba64beSDimitry Andric   return std::move(item.get());
7269dba64beSDimitry Andric }
7279dba64beSDimitry Andric 
7289dba64beSDimitry Andric Expected<PythonObject>
7299dba64beSDimitry Andric PythonDictionary::GetItem(const PythonObject &key) const {
7309dba64beSDimitry Andric   if (!IsValid())
7319dba64beSDimitry Andric     return nullDeref();
7329dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3
7339dba64beSDimitry Andric   PyObject *o = PyDict_GetItemWithError(m_py_obj, key.get());
7349dba64beSDimitry Andric   if (PyErr_Occurred())
7359dba64beSDimitry Andric     return exception();
7369dba64beSDimitry Andric #else
7379dba64beSDimitry Andric   PyObject *o = PyDict_GetItem(m_py_obj, key.get());
7389dba64beSDimitry Andric #endif
7399dba64beSDimitry Andric   if (!o)
7409dba64beSDimitry Andric     return keyError();
7419dba64beSDimitry Andric   return Retain<PythonObject>(o);
7429dba64beSDimitry Andric }
7439dba64beSDimitry Andric 
7449dba64beSDimitry Andric Expected<PythonObject> PythonDictionary::GetItem(const Twine &key) const {
7459dba64beSDimitry Andric   if (!IsValid())
7469dba64beSDimitry Andric     return nullDeref();
7479dba64beSDimitry Andric   PyObject *o = PyDict_GetItemString(m_py_obj, NullTerminated(key));
7489dba64beSDimitry Andric   if (PyErr_Occurred())
7499dba64beSDimitry Andric     return exception();
7509dba64beSDimitry Andric   if (!o)
7519dba64beSDimitry Andric     return keyError();
7529dba64beSDimitry Andric   return Retain<PythonObject>(o);
7539dba64beSDimitry Andric }
7549dba64beSDimitry Andric 
7559dba64beSDimitry Andric Error PythonDictionary::SetItem(const PythonObject &key,
7569dba64beSDimitry Andric                                 const PythonObject &value) const {
7579dba64beSDimitry Andric   if (!IsValid() || !value.IsValid())
7589dba64beSDimitry Andric     return nullDeref();
7599dba64beSDimitry Andric   int r = PyDict_SetItem(m_py_obj, key.get(), value.get());
7609dba64beSDimitry Andric   if (r < 0)
7619dba64beSDimitry Andric     return exception();
7629dba64beSDimitry Andric   return Error::success();
7639dba64beSDimitry Andric }
7649dba64beSDimitry Andric 
7659dba64beSDimitry Andric Error PythonDictionary::SetItem(const Twine &key,
7669dba64beSDimitry Andric                                 const PythonObject &value) const {
7679dba64beSDimitry Andric   if (!IsValid() || !value.IsValid())
7689dba64beSDimitry Andric     return nullDeref();
7699dba64beSDimitry Andric   int r = PyDict_SetItemString(m_py_obj, NullTerminated(key), value.get());
7709dba64beSDimitry Andric   if (r < 0)
7719dba64beSDimitry Andric     return exception();
7729dba64beSDimitry Andric   return Error::success();
7739dba64beSDimitry Andric }
7740b57cec5SDimitry Andric 
7750b57cec5SDimitry Andric void PythonDictionary::SetItemForKey(const PythonObject &key,
7760b57cec5SDimitry Andric                                      const PythonObject &value) {
7779dba64beSDimitry Andric   Error error = SetItem(key, value);
7789dba64beSDimitry Andric   if (error)
7799dba64beSDimitry Andric     llvm::consumeError(std::move(error));
7800b57cec5SDimitry Andric }
7810b57cec5SDimitry Andric 
7820b57cec5SDimitry Andric StructuredData::DictionarySP
7830b57cec5SDimitry Andric PythonDictionary::CreateStructuredDictionary() const {
7840b57cec5SDimitry Andric   StructuredData::DictionarySP result(new StructuredData::Dictionary);
7850b57cec5SDimitry Andric   PythonList keys(GetKeys());
7860b57cec5SDimitry Andric   uint32_t num_keys = keys.GetSize();
7870b57cec5SDimitry Andric   for (uint32_t i = 0; i < num_keys; ++i) {
7880b57cec5SDimitry Andric     PythonObject key = keys.GetItemAtIndex(i);
7890b57cec5SDimitry Andric     PythonObject value = GetItemForKey(key);
7900b57cec5SDimitry Andric     StructuredData::ObjectSP structured_value = value.CreateStructuredObject();
7910b57cec5SDimitry Andric     result->AddItem(key.Str().GetString(), structured_value);
7920b57cec5SDimitry Andric   }
7930b57cec5SDimitry Andric   return result;
7940b57cec5SDimitry Andric }
7950b57cec5SDimitry Andric 
7960b57cec5SDimitry Andric PythonModule PythonModule::BuiltinsModule() {
7970b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3
7980b57cec5SDimitry Andric   return AddModule("builtins");
7990b57cec5SDimitry Andric #else
8000b57cec5SDimitry Andric   return AddModule("__builtin__");
8010b57cec5SDimitry Andric #endif
8020b57cec5SDimitry Andric }
8030b57cec5SDimitry Andric 
8040b57cec5SDimitry Andric PythonModule PythonModule::MainModule() { return AddModule("__main__"); }
8050b57cec5SDimitry Andric 
8060b57cec5SDimitry Andric PythonModule PythonModule::AddModule(llvm::StringRef module) {
8070b57cec5SDimitry Andric   std::string str = module.str();
8080b57cec5SDimitry Andric   return PythonModule(PyRefType::Borrowed, PyImport_AddModule(str.c_str()));
8090b57cec5SDimitry Andric }
8100b57cec5SDimitry Andric 
8119dba64beSDimitry Andric Expected<PythonModule> PythonModule::Import(const Twine &name) {
8129dba64beSDimitry Andric   PyObject *mod = PyImport_ImportModule(NullTerminated(name));
8139dba64beSDimitry Andric   if (!mod)
8149dba64beSDimitry Andric     return exception();
8159dba64beSDimitry Andric   return Take<PythonModule>(mod);
8169dba64beSDimitry Andric }
8179dba64beSDimitry Andric 
8189dba64beSDimitry Andric Expected<PythonObject> PythonModule::Get(const Twine &name) {
8199dba64beSDimitry Andric   if (!IsValid())
8209dba64beSDimitry Andric     return nullDeref();
8219dba64beSDimitry Andric   PyObject *dict = PyModule_GetDict(m_py_obj);
8229dba64beSDimitry Andric   if (!dict)
8239dba64beSDimitry Andric     return exception();
8249dba64beSDimitry Andric   PyObject *item = PyDict_GetItemString(dict, NullTerminated(name));
8259dba64beSDimitry Andric   if (!item)
8269dba64beSDimitry Andric     return exception();
8279dba64beSDimitry Andric   return Retain<PythonObject>(item);
8280b57cec5SDimitry Andric }
8290b57cec5SDimitry Andric 
8300b57cec5SDimitry Andric bool PythonModule::Check(PyObject *py_obj) {
8310b57cec5SDimitry Andric   if (!py_obj)
8320b57cec5SDimitry Andric     return false;
8330b57cec5SDimitry Andric 
8340b57cec5SDimitry Andric   return PyModule_Check(py_obj);
8350b57cec5SDimitry Andric }
8360b57cec5SDimitry Andric 
8370b57cec5SDimitry Andric PythonDictionary PythonModule::GetDictionary() const {
8389dba64beSDimitry Andric   if (!IsValid())
8399dba64beSDimitry Andric     return PythonDictionary();
8409dba64beSDimitry Andric   return Retain<PythonDictionary>(PyModule_GetDict(m_py_obj));
8410b57cec5SDimitry Andric }
8420b57cec5SDimitry Andric 
8430b57cec5SDimitry Andric bool PythonCallable::Check(PyObject *py_obj) {
8440b57cec5SDimitry Andric   if (!py_obj)
8450b57cec5SDimitry Andric     return false;
8460b57cec5SDimitry Andric 
8470b57cec5SDimitry Andric   return PyCallable_Check(py_obj);
8480b57cec5SDimitry Andric }
8490b57cec5SDimitry Andric 
#if PY_MAJOR_VERSION >= 3 && PY_MINOR_VERSION >= 3
// Python helper used by PythonCallable::GetArgInfo. Its `main(f)` counts the
// positional parameters of `f` using inspect.signature and reports whether
// `f` accepts *args.
//
// The script is compiled for every Python >= 3.3 (see the guard above), so it
// must avoid syntax newer than that; in particular it uses str.format rather
// than an f-string, which would be a syntax error before Python 3.6.
static const char get_arg_info_script[] = R"(
from inspect import signature, Parameter, ismethod
from collections import namedtuple
ArgInfo = namedtuple('ArgInfo', ['count', 'has_varargs'])
def main(f):
    count = 0
    varargs = False
    for parameter in signature(f).parameters.values():
        kind = parameter.kind
        if kind in (Parameter.POSITIONAL_ONLY,
                    Parameter.POSITIONAL_OR_KEYWORD):
            count += 1
        elif kind == Parameter.VAR_POSITIONAL:
            varargs = True
        elif kind in (Parameter.KEYWORD_ONLY,
                      Parameter.VAR_KEYWORD):
            pass
        else:
            raise Exception('unknown parameter kind: {}'.format(kind))
    return ArgInfo(count, varargs)
)";
#endif
8739dba64beSDimitry Andric 
8749dba64beSDimitry Andric Expected<PythonCallable::ArgInfo> PythonCallable::GetArgInfo() const {
8759dba64beSDimitry Andric   ArgInfo result = {};
8769dba64beSDimitry Andric   if (!IsValid())
8779dba64beSDimitry Andric     return nullDeref();
8789dba64beSDimitry Andric 
8799dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 && PY_MINOR_VERSION >= 3
8809dba64beSDimitry Andric 
8819dba64beSDimitry Andric   // no need to synchronize access to this global, we already have the GIL
8829dba64beSDimitry Andric   static PythonScript get_arg_info(get_arg_info_script);
8839dba64beSDimitry Andric   Expected<PythonObject> pyarginfo = get_arg_info(*this);
8849dba64beSDimitry Andric   if (!pyarginfo)
8859dba64beSDimitry Andric     return pyarginfo.takeError();
886480093f4SDimitry Andric   long long count =
887480093f4SDimitry Andric       cantFail(As<long long>(pyarginfo.get().GetAttribute("count")));
888480093f4SDimitry Andric   bool has_varargs =
8899dba64beSDimitry Andric       cantFail(As<bool>(pyarginfo.get().GetAttribute("has_varargs")));
890480093f4SDimitry Andric   result.max_positional_args = has_varargs ? ArgInfo::UNBOUNDED : count;
8919dba64beSDimitry Andric 
8929dba64beSDimitry Andric #else
893480093f4SDimitry Andric   PyObject *py_func_obj;
8949dba64beSDimitry Andric   bool is_bound_method = false;
895480093f4SDimitry Andric   bool is_class = false;
896480093f4SDimitry Andric 
897480093f4SDimitry Andric   if (PyType_Check(m_py_obj) || PyClass_Check(m_py_obj)) {
898480093f4SDimitry Andric     auto init = GetAttribute("__init__");
899480093f4SDimitry Andric     if (!init)
900480093f4SDimitry Andric       return init.takeError();
901480093f4SDimitry Andric     py_func_obj = init.get().get();
902480093f4SDimitry Andric     is_class = true;
903480093f4SDimitry Andric   } else {
904480093f4SDimitry Andric     py_func_obj = m_py_obj;
905480093f4SDimitry Andric   }
906480093f4SDimitry Andric 
9070b57cec5SDimitry Andric   if (PyMethod_Check(py_func_obj)) {
9080b57cec5SDimitry Andric     py_func_obj = PyMethod_GET_FUNCTION(py_func_obj);
9090b57cec5SDimitry Andric     PythonObject im_self = GetAttributeValue("im_self");
9100b57cec5SDimitry Andric     if (im_self.IsValid() && !im_self.IsNone())
9119dba64beSDimitry Andric       is_bound_method = true;
9120b57cec5SDimitry Andric   } else {
9130b57cec5SDimitry Andric     // see if this is a callable object with an __call__ method
9140b57cec5SDimitry Andric     if (!PyFunction_Check(py_func_obj)) {
9150b57cec5SDimitry Andric       PythonObject __call__ = GetAttributeValue("__call__");
9160b57cec5SDimitry Andric       if (__call__.IsValid()) {
9170b57cec5SDimitry Andric         auto __callable__ = __call__.AsType<PythonCallable>();
9180b57cec5SDimitry Andric         if (__callable__.IsValid()) {
9190b57cec5SDimitry Andric           py_func_obj = PyMethod_GET_FUNCTION(__callable__.get());
9209dba64beSDimitry Andric           PythonObject im_self = __callable__.GetAttributeValue("im_self");
9210b57cec5SDimitry Andric           if (im_self.IsValid() && !im_self.IsNone())
9229dba64beSDimitry Andric             is_bound_method = true;
9230b57cec5SDimitry Andric         }
9240b57cec5SDimitry Andric       }
9250b57cec5SDimitry Andric     }
9260b57cec5SDimitry Andric   }
9270b57cec5SDimitry Andric 
9280b57cec5SDimitry Andric   if (!py_func_obj)
9290b57cec5SDimitry Andric     return result;
9300b57cec5SDimitry Andric 
9310b57cec5SDimitry Andric   PyCodeObject *code = (PyCodeObject *)PyFunction_GET_CODE(py_func_obj);
9320b57cec5SDimitry Andric   if (!code)
9330b57cec5SDimitry Andric     return result;
9340b57cec5SDimitry Andric 
935480093f4SDimitry Andric   auto count = code->co_argcount;
936480093f4SDimitry Andric   bool has_varargs = !!(code->co_flags & CO_VARARGS);
937480093f4SDimitry Andric   result.max_positional_args =
938480093f4SDimitry Andric       has_varargs ? ArgInfo::UNBOUNDED
939480093f4SDimitry Andric                   : (count - (int)is_bound_method) - (int)is_class;
9409dba64beSDimitry Andric 
9419dba64beSDimitry Andric #endif
9429dba64beSDimitry Andric 
9430b57cec5SDimitry Andric   return result;
9440b57cec5SDimitry Andric }
9450b57cec5SDimitry Andric 
9469dba64beSDimitry Andric constexpr unsigned
9479dba64beSDimitry Andric     PythonCallable::ArgInfo::UNBOUNDED; // FIXME delete after c++17
9489dba64beSDimitry Andric 
9490b57cec5SDimitry Andric PythonObject PythonCallable::operator()() {
9500b57cec5SDimitry Andric   return PythonObject(PyRefType::Owned, PyObject_CallObject(m_py_obj, nullptr));
9510b57cec5SDimitry Andric }
9520b57cec5SDimitry Andric 
9530b57cec5SDimitry Andric PythonObject PythonCallable::
9540b57cec5SDimitry Andric operator()(std::initializer_list<PyObject *> args) {
9550b57cec5SDimitry Andric   PythonTuple arg_tuple(args);
9560b57cec5SDimitry Andric   return PythonObject(PyRefType::Owned,
9570b57cec5SDimitry Andric                       PyObject_CallObject(m_py_obj, arg_tuple.get()));
9580b57cec5SDimitry Andric }
9590b57cec5SDimitry Andric 
9600b57cec5SDimitry Andric PythonObject PythonCallable::
9610b57cec5SDimitry Andric operator()(std::initializer_list<PythonObject> args) {
9620b57cec5SDimitry Andric   PythonTuple arg_tuple(args);
9630b57cec5SDimitry Andric   return PythonObject(PyRefType::Owned,
9640b57cec5SDimitry Andric                       PyObject_CallObject(m_py_obj, arg_tuple.get()));
9650b57cec5SDimitry Andric }
9660b57cec5SDimitry Andric 
9670b57cec5SDimitry Andric bool PythonFile::Check(PyObject *py_obj) {
9689dba64beSDimitry Andric   if (!py_obj)
9699dba64beSDimitry Andric     return false;
9700b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3
9710b57cec5SDimitry Andric   return PyFile_Check(py_obj);
9720b57cec5SDimitry Andric #else
9730b57cec5SDimitry Andric   // In Python 3, there is no `PyFile_Check`, and in fact PyFile is not even a
9740b57cec5SDimitry Andric   // first-class object type anymore.  `PyFile_FromFd` is just a thin wrapper
9750b57cec5SDimitry Andric   // over `io.open()`, which returns some object derived from `io.IOBase`. As a
9760b57cec5SDimitry Andric   // result, the only way to detect a file in Python 3 is to check whether it
9779dba64beSDimitry Andric   // inherits from `io.IOBase`.
9789dba64beSDimitry Andric   auto io_module = PythonModule::Import("io");
9799dba64beSDimitry Andric   if (!io_module) {
9809dba64beSDimitry Andric     llvm::consumeError(io_module.takeError());
9810b57cec5SDimitry Andric     return false;
9829dba64beSDimitry Andric   }
9839dba64beSDimitry Andric   auto iobase = io_module.get().Get("IOBase");
9849dba64beSDimitry Andric   if (!iobase) {
9859dba64beSDimitry Andric     llvm::consumeError(iobase.takeError());
9860b57cec5SDimitry Andric     return false;
9879dba64beSDimitry Andric   }
9889dba64beSDimitry Andric   int r = PyObject_IsInstance(py_obj, iobase.get().get());
9899dba64beSDimitry Andric   if (r < 0) {
9909dba64beSDimitry Andric     llvm::consumeError(exception()); // clear the exception and log it.
9919dba64beSDimitry Andric     return false;
9929dba64beSDimitry Andric   }
9939dba64beSDimitry Andric   return !!r;
9940b57cec5SDimitry Andric #endif
9950b57cec5SDimitry Andric }
9960b57cec5SDimitry Andric 
9979dba64beSDimitry Andric namespace {
9989dba64beSDimitry Andric class GIL {
9999dba64beSDimitry Andric public:
10009dba64beSDimitry Andric   GIL() {
10019dba64beSDimitry Andric     m_state = PyGILState_Ensure();
10029dba64beSDimitry Andric     assert(!PyErr_Occurred());
10039dba64beSDimitry Andric   }
10049dba64beSDimitry Andric   ~GIL() { PyGILState_Release(m_state); }
10050b57cec5SDimitry Andric 
10069dba64beSDimitry Andric protected:
10079dba64beSDimitry Andric   PyGILState_STATE m_state;
10089dba64beSDimitry Andric };
10099dba64beSDimitry Andric } // namespace
10109dba64beSDimitry Andric 
10119dba64beSDimitry Andric const char *PythonException::toCString() const {
10129dba64beSDimitry Andric   if (!m_repr_bytes)
10139dba64beSDimitry Andric     return "unknown exception";
10149dba64beSDimitry Andric   return PyBytes_AS_STRING(m_repr_bytes);
10150b57cec5SDimitry Andric }
10160b57cec5SDimitry Andric 
10179dba64beSDimitry Andric PythonException::PythonException(const char *caller) {
10189dba64beSDimitry Andric   assert(PyErr_Occurred());
10199dba64beSDimitry Andric   m_exception_type = m_exception = m_traceback = m_repr_bytes = NULL;
10209dba64beSDimitry Andric   PyErr_Fetch(&m_exception_type, &m_exception, &m_traceback);
10219dba64beSDimitry Andric   PyErr_NormalizeException(&m_exception_type, &m_exception, &m_traceback);
10229dba64beSDimitry Andric   PyErr_Clear();
10239dba64beSDimitry Andric   if (m_exception) {
10249dba64beSDimitry Andric     PyObject *repr = PyObject_Repr(m_exception);
10259dba64beSDimitry Andric     if (repr) {
10269dba64beSDimitry Andric       m_repr_bytes = PyUnicode_AsEncodedString(repr, "utf-8", nullptr);
10279dba64beSDimitry Andric       if (!m_repr_bytes) {
10289dba64beSDimitry Andric         PyErr_Clear();
10299dba64beSDimitry Andric       }
10309dba64beSDimitry Andric       Py_XDECREF(repr);
10319dba64beSDimitry Andric     } else {
10329dba64beSDimitry Andric       PyErr_Clear();
10339dba64beSDimitry Andric     }
10349dba64beSDimitry Andric   }
10359dba64beSDimitry Andric   Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SCRIPT);
10369dba64beSDimitry Andric   if (caller)
10379dba64beSDimitry Andric     LLDB_LOGF(log, "%s failed with exception: %s", caller, toCString());
10389dba64beSDimitry Andric   else
10399dba64beSDimitry Andric     LLDB_LOGF(log, "python exception: %s", toCString());
10409dba64beSDimitry Andric }
10419dba64beSDimitry Andric void PythonException::Restore() {
10429dba64beSDimitry Andric   if (m_exception_type && m_exception) {
10439dba64beSDimitry Andric     PyErr_Restore(m_exception_type, m_exception, m_traceback);
10449dba64beSDimitry Andric   } else {
10459dba64beSDimitry Andric     PyErr_SetString(PyExc_Exception, toCString());
10469dba64beSDimitry Andric   }
10479dba64beSDimitry Andric   m_exception_type = m_exception = m_traceback = NULL;
10480b57cec5SDimitry Andric }
10490b57cec5SDimitry Andric 
10509dba64beSDimitry Andric PythonException::~PythonException() {
10519dba64beSDimitry Andric   Py_XDECREF(m_exception_type);
10529dba64beSDimitry Andric   Py_XDECREF(m_exception);
10539dba64beSDimitry Andric   Py_XDECREF(m_traceback);
10549dba64beSDimitry Andric   Py_XDECREF(m_repr_bytes);
10550b57cec5SDimitry Andric }
10560b57cec5SDimitry Andric 
10579dba64beSDimitry Andric void PythonException::log(llvm::raw_ostream &OS) const { OS << toCString(); }
10589dba64beSDimitry Andric 
10599dba64beSDimitry Andric std::error_code PythonException::convertToErrorCode() const {
10609dba64beSDimitry Andric   return llvm::inconvertibleErrorCode();
10619dba64beSDimitry Andric }
10629dba64beSDimitry Andric 
10639dba64beSDimitry Andric bool PythonException::Matches(PyObject *exc) const {
10649dba64beSDimitry Andric   return PyErr_GivenExceptionMatches(m_exception_type, exc);
10659dba64beSDimitry Andric }
10669dba64beSDimitry Andric 
// Python helper used by PythonException::ReadBacktrace. Its
// `main(exc_type, exc_value, tb)` formats the exception with
// traceback.print_exception into an in-memory buffer and returns the text.
static const char read_exception_script[] = R"(
import sys
from traceback import print_exception
if sys.version_info.major < 3:
  from StringIO import StringIO
else:
  from io import StringIO
def main(exc_type, exc_value, tb):
  f = StringIO()
  print_exception(exc_type, exc_value, tb, file=f)
  return f.getvalue()
)";
10799dba64beSDimitry Andric 
10809dba64beSDimitry Andric std::string PythonException::ReadBacktrace() const {
10819dba64beSDimitry Andric 
10829dba64beSDimitry Andric   if (!m_traceback)
10839dba64beSDimitry Andric     return toCString();
10849dba64beSDimitry Andric 
10859dba64beSDimitry Andric   // no need to synchronize access to this global, we already have the GIL
10869dba64beSDimitry Andric   static PythonScript read_exception(read_exception_script);
10879dba64beSDimitry Andric 
10889dba64beSDimitry Andric   Expected<std::string> backtrace = As<std::string>(
10899dba64beSDimitry Andric       read_exception(m_exception_type, m_exception, m_traceback));
10909dba64beSDimitry Andric 
10919dba64beSDimitry Andric   if (!backtrace) {
10929dba64beSDimitry Andric     std::string message =
10939dba64beSDimitry Andric         std::string(toCString()) + "\n" +
1094*5ffd83dbSDimitry Andric         "Traceback unavailable, an error occurred while reading it:\n";
10959dba64beSDimitry Andric     return (message + llvm::toString(backtrace.takeError()));
10969dba64beSDimitry Andric   }
10979dba64beSDimitry Andric 
10989dba64beSDimitry Andric   return std::move(backtrace.get());
10999dba64beSDimitry Andric }
11009dba64beSDimitry Andric 
11019dba64beSDimitry Andric char PythonException::ID = 0;
11029dba64beSDimitry Andric 
11039dba64beSDimitry Andric llvm::Expected<File::OpenOptions>
11049dba64beSDimitry Andric GetOptionsForPyObject(const PythonObject &obj) {
11050b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3
11069dba64beSDimitry Andric   auto options = File::OpenOptions(0);
11079dba64beSDimitry Andric   auto readable = As<bool>(obj.CallMethod("readable"));
11089dba64beSDimitry Andric   if (!readable)
11099dba64beSDimitry Andric     return readable.takeError();
11109dba64beSDimitry Andric   auto writable = As<bool>(obj.CallMethod("writable"));
11119dba64beSDimitry Andric   if (!writable)
11129dba64beSDimitry Andric     return writable.takeError();
11139dba64beSDimitry Andric   if (readable.get())
11149dba64beSDimitry Andric     options |= File::eOpenOptionRead;
11159dba64beSDimitry Andric   if (writable.get())
11169dba64beSDimitry Andric     options |= File::eOpenOptionWrite;
11179dba64beSDimitry Andric   return options;
11189dba64beSDimitry Andric #else
11199dba64beSDimitry Andric   PythonString py_mode = obj.GetAttributeValue("mode").AsType<PythonString>();
11209dba64beSDimitry Andric   return File::GetOptionsFromMode(py_mode.GetString());
11219dba64beSDimitry Andric #endif
11229dba64beSDimitry Andric }
11239dba64beSDimitry Andric 
11249dba64beSDimitry Andric // Base class template for python files.   All it knows how to do
11259dba64beSDimitry Andric // is hold a reference to the python object and close or flush it
11269dba64beSDimitry Andric // when the File is closed.
11279dba64beSDimitry Andric namespace {
11289dba64beSDimitry Andric template <typename Base> class OwnedPythonFile : public Base {
11299dba64beSDimitry Andric public:
11309dba64beSDimitry Andric   template <typename... Args>
11319dba64beSDimitry Andric   OwnedPythonFile(const PythonFile &file, bool borrowed, Args... args)
11329dba64beSDimitry Andric       : Base(args...), m_py_obj(file), m_borrowed(borrowed) {
11339dba64beSDimitry Andric     assert(m_py_obj);
11349dba64beSDimitry Andric   }
11359dba64beSDimitry Andric 
11369dba64beSDimitry Andric   ~OwnedPythonFile() override {
11379dba64beSDimitry Andric     assert(m_py_obj);
11389dba64beSDimitry Andric     GIL takeGIL;
11399dba64beSDimitry Andric     Close();
11409dba64beSDimitry Andric     // we need to ensure the python object is released while we still
11419dba64beSDimitry Andric     // hold the GIL
11429dba64beSDimitry Andric     m_py_obj.Reset();
11439dba64beSDimitry Andric   }
11449dba64beSDimitry Andric 
11459dba64beSDimitry Andric   bool IsPythonSideValid() const {
11469dba64beSDimitry Andric     GIL takeGIL;
11479dba64beSDimitry Andric     auto closed = As<bool>(m_py_obj.GetAttribute("closed"));
11489dba64beSDimitry Andric     if (!closed) {
11499dba64beSDimitry Andric       llvm::consumeError(closed.takeError());
11509dba64beSDimitry Andric       return false;
11519dba64beSDimitry Andric     }
11529dba64beSDimitry Andric     return !closed.get();
11539dba64beSDimitry Andric   }
11549dba64beSDimitry Andric 
11559dba64beSDimitry Andric   bool IsValid() const override {
11569dba64beSDimitry Andric     return IsPythonSideValid() && Base::IsValid();
11579dba64beSDimitry Andric   }
11589dba64beSDimitry Andric 
11599dba64beSDimitry Andric   Status Close() override {
11609dba64beSDimitry Andric     assert(m_py_obj);
11619dba64beSDimitry Andric     Status py_error, base_error;
11629dba64beSDimitry Andric     GIL takeGIL;
11639dba64beSDimitry Andric     if (!m_borrowed) {
11649dba64beSDimitry Andric       auto r = m_py_obj.CallMethod("close");
11659dba64beSDimitry Andric       if (!r)
11669dba64beSDimitry Andric         py_error = Status(r.takeError());
11679dba64beSDimitry Andric     }
11689dba64beSDimitry Andric     base_error = Base::Close();
11699dba64beSDimitry Andric     if (py_error.Fail())
11709dba64beSDimitry Andric       return py_error;
11719dba64beSDimitry Andric     return base_error;
11729dba64beSDimitry Andric   };
11739dba64beSDimitry Andric 
11749dba64beSDimitry Andric   PyObject *GetPythonObject() const {
11759dba64beSDimitry Andric     assert(m_py_obj.IsValid());
11769dba64beSDimitry Andric     return m_py_obj.get();
11779dba64beSDimitry Andric   }
11789dba64beSDimitry Andric 
11799dba64beSDimitry Andric   static bool classof(const File *file) = delete;
11809dba64beSDimitry Andric 
11819dba64beSDimitry Andric protected:
11829dba64beSDimitry Andric   PythonFile m_py_obj;
11839dba64beSDimitry Andric   bool m_borrowed;
11849dba64beSDimitry Andric };
11859dba64beSDimitry Andric } // namespace
11869dba64beSDimitry Andric 
11879dba64beSDimitry Andric // A SimplePythonFile is a OwnedPythonFile that just does all I/O as
11889dba64beSDimitry Andric // a NativeFile
11899dba64beSDimitry Andric namespace {
11909dba64beSDimitry Andric class SimplePythonFile : public OwnedPythonFile<NativeFile> {
11919dba64beSDimitry Andric public:
11929dba64beSDimitry Andric   SimplePythonFile(const PythonFile &file, bool borrowed, int fd,
11939dba64beSDimitry Andric                    File::OpenOptions options)
11949dba64beSDimitry Andric       : OwnedPythonFile(file, borrowed, fd, options, false) {}
11959dba64beSDimitry Andric 
11969dba64beSDimitry Andric   static char ID;
11979dba64beSDimitry Andric   bool isA(const void *classID) const override {
11989dba64beSDimitry Andric     return classID == &ID || NativeFile::isA(classID);
11999dba64beSDimitry Andric   }
12009dba64beSDimitry Andric   static bool classof(const File *file) { return file->isA(&ID); }
12019dba64beSDimitry Andric };
12029dba64beSDimitry Andric char SimplePythonFile::ID = 0;
12039dba64beSDimitry Andric } // namespace
12049dba64beSDimitry Andric 
12059dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3
12069dba64beSDimitry Andric 
12079dba64beSDimitry Andric namespace {
12089dba64beSDimitry Andric class PythonBuffer {
12099dba64beSDimitry Andric public:
12109dba64beSDimitry Andric   PythonBuffer &operator=(const PythonBuffer &) = delete;
12119dba64beSDimitry Andric   PythonBuffer(const PythonBuffer &) = delete;
12129dba64beSDimitry Andric 
12139dba64beSDimitry Andric   static Expected<PythonBuffer> Create(PythonObject &obj,
12149dba64beSDimitry Andric                                        int flags = PyBUF_SIMPLE) {
12159dba64beSDimitry Andric     Py_buffer py_buffer = {};
12169dba64beSDimitry Andric     PyObject_GetBuffer(obj.get(), &py_buffer, flags);
12179dba64beSDimitry Andric     if (!py_buffer.obj)
12189dba64beSDimitry Andric       return llvm::make_error<PythonException>();
12199dba64beSDimitry Andric     return PythonBuffer(py_buffer);
12209dba64beSDimitry Andric   }
12219dba64beSDimitry Andric 
12229dba64beSDimitry Andric   PythonBuffer(PythonBuffer &&other) {
12239dba64beSDimitry Andric     m_buffer = other.m_buffer;
12249dba64beSDimitry Andric     other.m_buffer.obj = nullptr;
12259dba64beSDimitry Andric   }
12269dba64beSDimitry Andric 
12279dba64beSDimitry Andric   ~PythonBuffer() {
12289dba64beSDimitry Andric     if (m_buffer.obj)
12299dba64beSDimitry Andric       PyBuffer_Release(&m_buffer);
12309dba64beSDimitry Andric   }
12319dba64beSDimitry Andric 
12329dba64beSDimitry Andric   Py_buffer &get() { return m_buffer; }
12339dba64beSDimitry Andric 
12349dba64beSDimitry Andric private:
12359dba64beSDimitry Andric   // takes ownership of the buffer.
12369dba64beSDimitry Andric   PythonBuffer(const Py_buffer &py_buffer) : m_buffer(py_buffer) {}
12379dba64beSDimitry Andric   Py_buffer m_buffer;
12389dba64beSDimitry Andric };
12399dba64beSDimitry Andric } // namespace
12409dba64beSDimitry Andric 
12419dba64beSDimitry Andric // Shared methods between TextPythonFile and BinaryPythonFile
12429dba64beSDimitry Andric namespace {
12439dba64beSDimitry Andric class PythonIOFile : public OwnedPythonFile<File> {
12449dba64beSDimitry Andric public:
12459dba64beSDimitry Andric   PythonIOFile(const PythonFile &file, bool borrowed)
12469dba64beSDimitry Andric       : OwnedPythonFile(file, borrowed) {}
12479dba64beSDimitry Andric 
12489dba64beSDimitry Andric   ~PythonIOFile() override { Close(); }
12499dba64beSDimitry Andric 
12509dba64beSDimitry Andric   bool IsValid() const override { return IsPythonSideValid(); }
12519dba64beSDimitry Andric 
12529dba64beSDimitry Andric   Status Close() override {
12539dba64beSDimitry Andric     assert(m_py_obj);
12549dba64beSDimitry Andric     GIL takeGIL;
12559dba64beSDimitry Andric     if (m_borrowed)
12569dba64beSDimitry Andric       return Flush();
12579dba64beSDimitry Andric     auto r = m_py_obj.CallMethod("close");
12589dba64beSDimitry Andric     if (!r)
12599dba64beSDimitry Andric       return Status(r.takeError());
12609dba64beSDimitry Andric     return Status();
12619dba64beSDimitry Andric   }
12629dba64beSDimitry Andric 
12639dba64beSDimitry Andric   Status Flush() override {
12649dba64beSDimitry Andric     GIL takeGIL;
12659dba64beSDimitry Andric     auto r = m_py_obj.CallMethod("flush");
12669dba64beSDimitry Andric     if (!r)
12679dba64beSDimitry Andric       return Status(r.takeError());
12689dba64beSDimitry Andric     return Status();
12699dba64beSDimitry Andric   }
12709dba64beSDimitry Andric 
12719dba64beSDimitry Andric   Expected<File::OpenOptions> GetOptions() const override {
12729dba64beSDimitry Andric     GIL takeGIL;
12739dba64beSDimitry Andric     return GetOptionsForPyObject(m_py_obj);
12749dba64beSDimitry Andric   }
12759dba64beSDimitry Andric 
12769dba64beSDimitry Andric   static char ID;
12779dba64beSDimitry Andric   bool isA(const void *classID) const override {
12789dba64beSDimitry Andric     return classID == &ID || File::isA(classID);
12799dba64beSDimitry Andric   }
12809dba64beSDimitry Andric   static bool classof(const File *file) { return file->isA(&ID); }
12819dba64beSDimitry Andric };
12829dba64beSDimitry Andric char PythonIOFile::ID = 0;
12839dba64beSDimitry Andric } // namespace
12849dba64beSDimitry Andric 
12859dba64beSDimitry Andric namespace {
12869dba64beSDimitry Andric class BinaryPythonFile : public PythonIOFile {
12879dba64beSDimitry Andric protected:
12889dba64beSDimitry Andric   int m_descriptor;
12899dba64beSDimitry Andric 
12909dba64beSDimitry Andric public:
12919dba64beSDimitry Andric   BinaryPythonFile(int fd, const PythonFile &file, bool borrowed)
12929dba64beSDimitry Andric       : PythonIOFile(file, borrowed),
12939dba64beSDimitry Andric         m_descriptor(File::DescriptorIsValid(fd) ? fd
12949dba64beSDimitry Andric                                                  : File::kInvalidDescriptor) {}
12959dba64beSDimitry Andric 
12969dba64beSDimitry Andric   int GetDescriptor() const override { return m_descriptor; }
12979dba64beSDimitry Andric 
12989dba64beSDimitry Andric   Status Write(const void *buf, size_t &num_bytes) override {
12999dba64beSDimitry Andric     GIL takeGIL;
13009dba64beSDimitry Andric     PyObject *pybuffer_p = PyMemoryView_FromMemory(
13019dba64beSDimitry Andric         const_cast<char *>((const char *)buf), num_bytes, PyBUF_READ);
13029dba64beSDimitry Andric     if (!pybuffer_p)
13039dba64beSDimitry Andric       return Status(llvm::make_error<PythonException>());
13049dba64beSDimitry Andric     auto pybuffer = Take<PythonObject>(pybuffer_p);
13059dba64beSDimitry Andric     num_bytes = 0;
13069dba64beSDimitry Andric     auto bytes_written = As<long long>(m_py_obj.CallMethod("write", pybuffer));
13079dba64beSDimitry Andric     if (!bytes_written)
13089dba64beSDimitry Andric       return Status(bytes_written.takeError());
13099dba64beSDimitry Andric     if (bytes_written.get() < 0)
13109dba64beSDimitry Andric       return Status(".write() method returned a negative number!");
13119dba64beSDimitry Andric     static_assert(sizeof(long long) >= sizeof(size_t), "overflow");
13129dba64beSDimitry Andric     num_bytes = bytes_written.get();
13139dba64beSDimitry Andric     return Status();
13149dba64beSDimitry Andric   }
13159dba64beSDimitry Andric 
13169dba64beSDimitry Andric   Status Read(void *buf, size_t &num_bytes) override {
13179dba64beSDimitry Andric     GIL takeGIL;
13189dba64beSDimitry Andric     static_assert(sizeof(long long) >= sizeof(size_t), "overflow");
13199dba64beSDimitry Andric     auto pybuffer_obj =
13209dba64beSDimitry Andric         m_py_obj.CallMethod("read", (unsigned long long)num_bytes);
13219dba64beSDimitry Andric     if (!pybuffer_obj)
13229dba64beSDimitry Andric       return Status(pybuffer_obj.takeError());
13239dba64beSDimitry Andric     num_bytes = 0;
13249dba64beSDimitry Andric     if (pybuffer_obj.get().IsNone()) {
13259dba64beSDimitry Andric       // EOF
13269dba64beSDimitry Andric       num_bytes = 0;
13279dba64beSDimitry Andric       return Status();
13289dba64beSDimitry Andric     }
13299dba64beSDimitry Andric     auto pybuffer = PythonBuffer::Create(pybuffer_obj.get());
13309dba64beSDimitry Andric     if (!pybuffer)
13319dba64beSDimitry Andric       return Status(pybuffer.takeError());
13329dba64beSDimitry Andric     memcpy(buf, pybuffer.get().get().buf, pybuffer.get().get().len);
13339dba64beSDimitry Andric     num_bytes = pybuffer.get().get().len;
13349dba64beSDimitry Andric     return Status();
13359dba64beSDimitry Andric   }
13369dba64beSDimitry Andric };
13379dba64beSDimitry Andric } // namespace
13389dba64beSDimitry Andric 
13399dba64beSDimitry Andric namespace {
13409dba64beSDimitry Andric class TextPythonFile : public PythonIOFile {
13419dba64beSDimitry Andric protected:
13429dba64beSDimitry Andric   int m_descriptor;
13439dba64beSDimitry Andric 
13449dba64beSDimitry Andric public:
13459dba64beSDimitry Andric   TextPythonFile(int fd, const PythonFile &file, bool borrowed)
13469dba64beSDimitry Andric       : PythonIOFile(file, borrowed),
13479dba64beSDimitry Andric         m_descriptor(File::DescriptorIsValid(fd) ? fd
13489dba64beSDimitry Andric                                                  : File::kInvalidDescriptor) {}
13499dba64beSDimitry Andric 
13509dba64beSDimitry Andric   int GetDescriptor() const override { return m_descriptor; }
13519dba64beSDimitry Andric 
13529dba64beSDimitry Andric   Status Write(const void *buf, size_t &num_bytes) override {
13539dba64beSDimitry Andric     GIL takeGIL;
13549dba64beSDimitry Andric     auto pystring =
13559dba64beSDimitry Andric         PythonString::FromUTF8(llvm::StringRef((const char *)buf, num_bytes));
13569dba64beSDimitry Andric     if (!pystring)
13579dba64beSDimitry Andric       return Status(pystring.takeError());
13589dba64beSDimitry Andric     num_bytes = 0;
13599dba64beSDimitry Andric     auto bytes_written =
13609dba64beSDimitry Andric         As<long long>(m_py_obj.CallMethod("write", pystring.get()));
13619dba64beSDimitry Andric     if (!bytes_written)
13629dba64beSDimitry Andric       return Status(bytes_written.takeError());
13639dba64beSDimitry Andric     if (bytes_written.get() < 0)
13649dba64beSDimitry Andric       return Status(".write() method returned a negative number!");
13659dba64beSDimitry Andric     static_assert(sizeof(long long) >= sizeof(size_t), "overflow");
13669dba64beSDimitry Andric     num_bytes = bytes_written.get();
13679dba64beSDimitry Andric     return Status();
13689dba64beSDimitry Andric   }
13699dba64beSDimitry Andric 
13709dba64beSDimitry Andric   Status Read(void *buf, size_t &num_bytes) override {
13719dba64beSDimitry Andric     GIL takeGIL;
13729dba64beSDimitry Andric     size_t num_chars = num_bytes / 6;
13739dba64beSDimitry Andric     size_t orig_num_bytes = num_bytes;
13749dba64beSDimitry Andric     num_bytes = 0;
13759dba64beSDimitry Andric     if (orig_num_bytes < 6) {
13769dba64beSDimitry Andric       return Status("can't read less than 6 bytes from a utf8 text stream");
13779dba64beSDimitry Andric     }
13789dba64beSDimitry Andric     auto pystring = As<PythonString>(
13799dba64beSDimitry Andric         m_py_obj.CallMethod("read", (unsigned long long)num_chars));
13809dba64beSDimitry Andric     if (!pystring)
13819dba64beSDimitry Andric       return Status(pystring.takeError());
13829dba64beSDimitry Andric     if (pystring.get().IsNone()) {
13839dba64beSDimitry Andric       // EOF
13849dba64beSDimitry Andric       return Status();
13859dba64beSDimitry Andric     }
13869dba64beSDimitry Andric     auto stringref = pystring.get().AsUTF8();
13879dba64beSDimitry Andric     if (!stringref)
13889dba64beSDimitry Andric       return Status(stringref.takeError());
13899dba64beSDimitry Andric     num_bytes = stringref.get().size();
13909dba64beSDimitry Andric     memcpy(buf, stringref.get().begin(), num_bytes);
13919dba64beSDimitry Andric     return Status();
13929dba64beSDimitry Andric   }
13939dba64beSDimitry Andric };
13949dba64beSDimitry Andric } // namespace
13959dba64beSDimitry Andric 
13969dba64beSDimitry Andric #endif
13979dba64beSDimitry Andric 
13989dba64beSDimitry Andric llvm::Expected<FileSP> PythonFile::ConvertToFile(bool borrowed) {
13999dba64beSDimitry Andric   if (!IsValid())
14009dba64beSDimitry Andric     return llvm::createStringError(llvm::inconvertibleErrorCode(),
14019dba64beSDimitry Andric                                    "invalid PythonFile");
14029dba64beSDimitry Andric 
14039dba64beSDimitry Andric   int fd = PyObject_AsFileDescriptor(m_py_obj);
14049dba64beSDimitry Andric   if (fd < 0) {
14059dba64beSDimitry Andric     PyErr_Clear();
14069dba64beSDimitry Andric     return ConvertToFileForcingUseOfScriptingIOMethods(borrowed);
14079dba64beSDimitry Andric   }
14089dba64beSDimitry Andric   auto options = GetOptionsForPyObject(*this);
14099dba64beSDimitry Andric   if (!options)
14109dba64beSDimitry Andric     return options.takeError();
14119dba64beSDimitry Andric 
1412480093f4SDimitry Andric   if (options.get() & File::eOpenOptionWrite) {
14139dba64beSDimitry Andric     // LLDB and python will not share I/O buffers.  We should probably
14149dba64beSDimitry Andric     // flush the python buffers now.
14159dba64beSDimitry Andric     auto r = CallMethod("flush");
14169dba64beSDimitry Andric     if (!r)
14179dba64beSDimitry Andric       return r.takeError();
1418480093f4SDimitry Andric   }
14199dba64beSDimitry Andric 
14209dba64beSDimitry Andric   FileSP file_sp;
14219dba64beSDimitry Andric   if (borrowed) {
14229dba64beSDimitry Andric     // In this case we we don't need to retain the python
14239dba64beSDimitry Andric     // object at all.
14249dba64beSDimitry Andric     file_sp = std::make_shared<NativeFile>(fd, options.get(), false);
14259dba64beSDimitry Andric   } else {
14269dba64beSDimitry Andric     file_sp = std::static_pointer_cast<File>(
14279dba64beSDimitry Andric         std::make_shared<SimplePythonFile>(*this, borrowed, fd, options.get()));
14289dba64beSDimitry Andric   }
14299dba64beSDimitry Andric   if (!file_sp->IsValid())
14309dba64beSDimitry Andric     return llvm::createStringError(llvm::inconvertibleErrorCode(),
14319dba64beSDimitry Andric                                    "invalid File");
14329dba64beSDimitry Andric 
14339dba64beSDimitry Andric   return file_sp;
14349dba64beSDimitry Andric }
14359dba64beSDimitry Andric 
14369dba64beSDimitry Andric llvm::Expected<FileSP>
14379dba64beSDimitry Andric PythonFile::ConvertToFileForcingUseOfScriptingIOMethods(bool borrowed) {
14389dba64beSDimitry Andric 
14399dba64beSDimitry Andric   assert(!PyErr_Occurred());
14409dba64beSDimitry Andric 
14419dba64beSDimitry Andric   if (!IsValid())
14429dba64beSDimitry Andric     return llvm::createStringError(llvm::inconvertibleErrorCode(),
14439dba64beSDimitry Andric                                    "invalid PythonFile");
14449dba64beSDimitry Andric 
14459dba64beSDimitry Andric #if PY_MAJOR_VERSION < 3
14469dba64beSDimitry Andric 
14479dba64beSDimitry Andric   return llvm::createStringError(llvm::inconvertibleErrorCode(),
14489dba64beSDimitry Andric                                  "not supported on python 2");
14499dba64beSDimitry Andric 
14509dba64beSDimitry Andric #else
14519dba64beSDimitry Andric 
14529dba64beSDimitry Andric   int fd = PyObject_AsFileDescriptor(m_py_obj);
14539dba64beSDimitry Andric   if (fd < 0) {
14549dba64beSDimitry Andric     PyErr_Clear();
14559dba64beSDimitry Andric     fd = File::kInvalidDescriptor;
14569dba64beSDimitry Andric   }
14579dba64beSDimitry Andric 
14589dba64beSDimitry Andric   auto io_module = PythonModule::Import("io");
14599dba64beSDimitry Andric   if (!io_module)
14609dba64beSDimitry Andric     return io_module.takeError();
14619dba64beSDimitry Andric   auto textIOBase = io_module.get().Get("TextIOBase");
14629dba64beSDimitry Andric   if (!textIOBase)
14639dba64beSDimitry Andric     return textIOBase.takeError();
14649dba64beSDimitry Andric   auto rawIOBase = io_module.get().Get("RawIOBase");
14659dba64beSDimitry Andric   if (!rawIOBase)
14669dba64beSDimitry Andric     return rawIOBase.takeError();
14679dba64beSDimitry Andric   auto bufferedIOBase = io_module.get().Get("BufferedIOBase");
14689dba64beSDimitry Andric   if (!bufferedIOBase)
14699dba64beSDimitry Andric     return bufferedIOBase.takeError();
14709dba64beSDimitry Andric 
14719dba64beSDimitry Andric   FileSP file_sp;
14729dba64beSDimitry Andric 
14739dba64beSDimitry Andric   auto isTextIO = IsInstance(textIOBase.get());
14749dba64beSDimitry Andric   if (!isTextIO)
14759dba64beSDimitry Andric     return isTextIO.takeError();
14769dba64beSDimitry Andric   if (isTextIO.get())
14779dba64beSDimitry Andric     file_sp = std::static_pointer_cast<File>(
14789dba64beSDimitry Andric         std::make_shared<TextPythonFile>(fd, *this, borrowed));
14799dba64beSDimitry Andric 
14809dba64beSDimitry Andric   auto isRawIO = IsInstance(rawIOBase.get());
14819dba64beSDimitry Andric   if (!isRawIO)
14829dba64beSDimitry Andric     return isRawIO.takeError();
14839dba64beSDimitry Andric   auto isBufferedIO = IsInstance(bufferedIOBase.get());
14849dba64beSDimitry Andric   if (!isBufferedIO)
14859dba64beSDimitry Andric     return isBufferedIO.takeError();
14869dba64beSDimitry Andric 
14879dba64beSDimitry Andric   if (isRawIO.get() || isBufferedIO.get()) {
14889dba64beSDimitry Andric     file_sp = std::static_pointer_cast<File>(
14899dba64beSDimitry Andric         std::make_shared<BinaryPythonFile>(fd, *this, borrowed));
14909dba64beSDimitry Andric   }
14919dba64beSDimitry Andric 
14929dba64beSDimitry Andric   if (!file_sp)
14939dba64beSDimitry Andric     return llvm::createStringError(llvm::inconvertibleErrorCode(),
14949dba64beSDimitry Andric                                    "python file is neither text nor binary");
14959dba64beSDimitry Andric 
14969dba64beSDimitry Andric   if (!file_sp->IsValid())
14979dba64beSDimitry Andric     return llvm::createStringError(llvm::inconvertibleErrorCode(),
14989dba64beSDimitry Andric                                    "invalid File");
14999dba64beSDimitry Andric 
15009dba64beSDimitry Andric   return file_sp;
15019dba64beSDimitry Andric 
15029dba64beSDimitry Andric #endif
15039dba64beSDimitry Andric }
15049dba64beSDimitry Andric 
15059dba64beSDimitry Andric Expected<PythonFile> PythonFile::FromFile(File &file, const char *mode) {
15069dba64beSDimitry Andric   if (!file.IsValid())
15079dba64beSDimitry Andric     return llvm::createStringError(llvm::inconvertibleErrorCode(),
15089dba64beSDimitry Andric                                    "invalid file");
15099dba64beSDimitry Andric 
15109dba64beSDimitry Andric   if (auto *simple = llvm::dyn_cast<SimplePythonFile>(&file))
15119dba64beSDimitry Andric     return Retain<PythonFile>(simple->GetPythonObject());
15129dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3
15139dba64beSDimitry Andric   if (auto *pythonio = llvm::dyn_cast<PythonIOFile>(&file))
15149dba64beSDimitry Andric     return Retain<PythonFile>(pythonio->GetPythonObject());
15159dba64beSDimitry Andric #endif
15169dba64beSDimitry Andric 
15179dba64beSDimitry Andric   if (!mode) {
15189dba64beSDimitry Andric     auto m = file.GetOpenMode();
15199dba64beSDimitry Andric     if (!m)
15209dba64beSDimitry Andric       return m.takeError();
15219dba64beSDimitry Andric     mode = m.get();
15229dba64beSDimitry Andric   }
15239dba64beSDimitry Andric 
15249dba64beSDimitry Andric   PyObject *file_obj;
15259dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3
15269dba64beSDimitry Andric   file_obj = PyFile_FromFd(file.GetDescriptor(), nullptr, mode, -1, nullptr,
1527480093f4SDimitry Andric                            "ignore", nullptr, /*closefd=*/0);
15280b57cec5SDimitry Andric #else
1529480093f4SDimitry Andric   // I'd like to pass ::fflush here if the file is writable,  so that
1530480093f4SDimitry Andric   // when the python side destructs the file object it will be flushed.
1531480093f4SDimitry Andric   // However, this would be dangerous.    It can cause fflush to be called
1532480093f4SDimitry Andric   // after fclose if the python program keeps a reference to the file after
1533480093f4SDimitry Andric   // the original lldb_private::File has been destructed.
1534480093f4SDimitry Andric   //
1535480093f4SDimitry Andric   // It's all well and good to ask a python program not to use a closed file
1536480093f4SDimitry Andric   // but asking a python program to make sure objects get released in a
1537480093f4SDimitry Andric   // particular order is not safe.
1538480093f4SDimitry Andric   //
1539480093f4SDimitry Andric   // The tradeoff here is that if a python 2 program wants to make sure this
1540480093f4SDimitry Andric   // file gets flushed, they'll have to do it explicitly or wait untill the
1541480093f4SDimitry Andric   // original lldb File itself gets flushed.
1542480093f4SDimitry Andric   file_obj = PyFile_FromFile(file.GetStream(), py2_const_cast(""),
1543480093f4SDimitry Andric                              py2_const_cast(mode), [](FILE *) { return 0; });
15440b57cec5SDimitry Andric #endif
15459dba64beSDimitry Andric 
15469dba64beSDimitry Andric   if (!file_obj)
15479dba64beSDimitry Andric     return exception();
15489dba64beSDimitry Andric 
15499dba64beSDimitry Andric   return Take<PythonFile>(file_obj);
15500b57cec5SDimitry Andric }
15510b57cec5SDimitry Andric 
15529dba64beSDimitry Andric Error PythonScript::Init() {
15539dba64beSDimitry Andric   if (function.IsValid())
15549dba64beSDimitry Andric     return Error::success();
15550b57cec5SDimitry Andric 
15569dba64beSDimitry Andric   PythonDictionary globals(PyInitialValue::Empty);
15579dba64beSDimitry Andric   auto builtins = PythonModule::BuiltinsModule();
15589dba64beSDimitry Andric   if (Error error = globals.SetItem("__builtins__", builtins))
15599dba64beSDimitry Andric     return error;
15609dba64beSDimitry Andric   PyObject *o =
15619dba64beSDimitry Andric       PyRun_String(script, Py_file_input, globals.get(), globals.get());
15629dba64beSDimitry Andric   if (!o)
15639dba64beSDimitry Andric     return exception();
15649dba64beSDimitry Andric   Take<PythonObject>(o);
15659dba64beSDimitry Andric   auto f = As<PythonCallable>(globals.GetItem("main"));
15669dba64beSDimitry Andric   if (!f)
15679dba64beSDimitry Andric     return f.takeError();
15689dba64beSDimitry Andric   function = std::move(f.get());
15699dba64beSDimitry Andric 
15709dba64beSDimitry Andric   return Error::success();
15710b57cec5SDimitry Andric }
15720b57cec5SDimitry Andric 
15739dba64beSDimitry Andric llvm::Expected<PythonObject>
15749dba64beSDimitry Andric python::runStringOneLine(const llvm::Twine &string,
15759dba64beSDimitry Andric                          const PythonDictionary &globals,
15769dba64beSDimitry Andric                          const PythonDictionary &locals) {
15779dba64beSDimitry Andric   if (!globals.IsValid() || !locals.IsValid())
15789dba64beSDimitry Andric     return nullDeref();
15790b57cec5SDimitry Andric 
15809dba64beSDimitry Andric   PyObject *code =
15819dba64beSDimitry Andric       Py_CompileString(NullTerminated(string), "<string>", Py_eval_input);
15829dba64beSDimitry Andric   if (!code) {
15839dba64beSDimitry Andric     PyErr_Clear();
15849dba64beSDimitry Andric     code =
15859dba64beSDimitry Andric         Py_CompileString(NullTerminated(string), "<string>", Py_single_input);
15869dba64beSDimitry Andric   }
15879dba64beSDimitry Andric   if (!code)
15889dba64beSDimitry Andric     return exception();
15899dba64beSDimitry Andric   auto code_ref = Take<PythonObject>(code);
15909dba64beSDimitry Andric 
15919dba64beSDimitry Andric #if PY_MAJOR_VERSION < 3
15929dba64beSDimitry Andric   PyObject *result =
15939dba64beSDimitry Andric       PyEval_EvalCode((PyCodeObject *)code, globals.get(), locals.get());
15949dba64beSDimitry Andric #else
15959dba64beSDimitry Andric   PyObject *result = PyEval_EvalCode(code, globals.get(), locals.get());
15969dba64beSDimitry Andric #endif
15979dba64beSDimitry Andric 
15989dba64beSDimitry Andric   if (!result)
15999dba64beSDimitry Andric     return exception();
16009dba64beSDimitry Andric 
16019dba64beSDimitry Andric   return Take<PythonObject>(result);
16029dba64beSDimitry Andric }
16039dba64beSDimitry Andric 
16049dba64beSDimitry Andric llvm::Expected<PythonObject>
16059dba64beSDimitry Andric python::runStringMultiLine(const llvm::Twine &string,
16069dba64beSDimitry Andric                            const PythonDictionary &globals,
16079dba64beSDimitry Andric                            const PythonDictionary &locals) {
16089dba64beSDimitry Andric   if (!globals.IsValid() || !locals.IsValid())
16099dba64beSDimitry Andric     return nullDeref();
16109dba64beSDimitry Andric   PyObject *result = PyRun_String(NullTerminated(string), Py_file_input,
16119dba64beSDimitry Andric                                   globals.get(), locals.get());
16129dba64beSDimitry Andric   if (!result)
16139dba64beSDimitry Andric     return exception();
16149dba64beSDimitry Andric   return Take<PythonObject>(result);
16150b57cec5SDimitry Andric }
16160b57cec5SDimitry Andric 
16170b57cec5SDimitry Andric #endif
1618