15ffd83dbSDimitry Andric //===-- PythonDataObjects.cpp ---------------------------------------------===// 2*0b57cec5SDimitry Andric // 3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6*0b57cec5SDimitry Andric // 7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 8*0b57cec5SDimitry Andric 9480093f4SDimitry Andric #include "lldb/Host/Config.h" 10*0b57cec5SDimitry Andric 11480093f4SDimitry Andric #if LLDB_ENABLE_PYTHON 12*0b57cec5SDimitry Andric 13*0b57cec5SDimitry Andric #include "PythonDataObjects.h" 14*0b57cec5SDimitry Andric #include "ScriptInterpreterPython.h" 15*0b57cec5SDimitry Andric 16*0b57cec5SDimitry Andric #include "lldb/Host/File.h" 17*0b57cec5SDimitry Andric #include "lldb/Host/FileSystem.h" 18*0b57cec5SDimitry Andric #include "lldb/Interpreter/ScriptInterpreter.h" 199dba64beSDimitry Andric #include "lldb/Utility/Log.h" 20*0b57cec5SDimitry Andric #include "lldb/Utility/Stream.h" 21*0b57cec5SDimitry Andric 22*0b57cec5SDimitry Andric #include "llvm/ADT/StringSwitch.h" 239dba64beSDimitry Andric #include "llvm/Support/Casting.h" 24*0b57cec5SDimitry Andric #include "llvm/Support/ConvertUTF.h" 25*0b57cec5SDimitry Andric #include "llvm/Support/Errno.h" 26*0b57cec5SDimitry Andric 27fe6060f1SDimitry Andric #include <cstdio> 28*0b57cec5SDimitry Andric 29*0b57cec5SDimitry Andric using namespace lldb_private; 30*0b57cec5SDimitry Andric using namespace lldb; 319dba64beSDimitry Andric using namespace lldb_private::python; 329dba64beSDimitry Andric using llvm::cantFail; 339dba64beSDimitry Andric using llvm::Error; 349dba64beSDimitry Andric using llvm::Expected; 359dba64beSDimitry Andric using llvm::Twine; 36*0b57cec5SDimitry Andric 379dba64beSDimitry Andric template <> Expected<bool> python::As<bool>(Expected<PythonObject> &&obj) { 389dba64beSDimitry Andric if (!obj) 399dba64beSDimitry Andric return obj.takeError(); 409dba64beSDimitry Andric return obj.get().IsTrue(); 419dba64beSDimitry Andric } 429dba64beSDimitry Andric 439dba64beSDimitry Andric template <> 449dba64beSDimitry Andric Expected<long long> python::As<long long>(Expected<PythonObject> &&obj) { 459dba64beSDimitry Andric if (!obj) 469dba64beSDimitry Andric return obj.takeError(); 475ffd83dbSDimitry Andric return obj->AsLongLong(); 485ffd83dbSDimitry Andric } 495ffd83dbSDimitry Andric 505ffd83dbSDimitry Andric template <> 515ffd83dbSDimitry Andric Expected<unsigned long long> 525ffd83dbSDimitry Andric python::As<unsigned long long>(Expected<PythonObject> &&obj) { 535ffd83dbSDimitry Andric if (!obj) 545ffd83dbSDimitry Andric return obj.takeError(); 555ffd83dbSDimitry Andric return obj->AsUnsignedLongLong(); 569dba64beSDimitry Andric } 579dba64beSDimitry Andric 589dba64beSDimitry Andric template <> 599dba64beSDimitry Andric Expected<std::string> python::As<std::string>(Expected<PythonObject> &&obj) { 609dba64beSDimitry Andric if (!obj) 619dba64beSDimitry Andric return obj.takeError(); 629dba64beSDimitry Andric PyObject *str_obj = PyObject_Str(obj.get().get()); 639dba64beSDimitry Andric if (!obj) 649dba64beSDimitry Andric return llvm::make_error<PythonException>(); 659dba64beSDimitry Andric auto str = Take<PythonString>(str_obj); 669dba64beSDimitry Andric auto utf8 = str.AsUTF8(); 679dba64beSDimitry Andric if (!utf8) 689dba64beSDimitry Andric return utf8.takeError(); 695ffd83dbSDimitry Andric return std::string(utf8.get()); 705ffd83dbSDimitry Andric } 715ffd83dbSDimitry Andric 725ffd83dbSDimitry Andric Expected<long long> PythonObject::AsLongLong() const { 735ffd83dbSDimitry Andric if (!m_py_obj) 745ffd83dbSDimitry Andric return nullDeref(); 755ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3 765ffd83dbSDimitry Andric if (!PyLong_Check(m_py_obj)) { 775ffd83dbSDimitry Andric PythonInteger i(PyRefType::Borrowed, m_py_obj); 785ffd83dbSDimitry Andric return i.AsLongLong(); 795ffd83dbSDimitry Andric } 805ffd83dbSDimitry Andric #endif 815ffd83dbSDimitry Andric assert(!PyErr_Occurred()); 825ffd83dbSDimitry Andric long long r = PyLong_AsLongLong(m_py_obj); 835ffd83dbSDimitry Andric if (PyErr_Occurred()) 845ffd83dbSDimitry Andric return exception(); 855ffd83dbSDimitry Andric return r; 865ffd83dbSDimitry Andric } 875ffd83dbSDimitry Andric 885ffd83dbSDimitry Andric Expected<long long> PythonObject::AsUnsignedLongLong() const { 895ffd83dbSDimitry Andric if (!m_py_obj) 905ffd83dbSDimitry Andric return nullDeref(); 915ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3 925ffd83dbSDimitry Andric if (!PyLong_Check(m_py_obj)) { 935ffd83dbSDimitry Andric PythonInteger i(PyRefType::Borrowed, m_py_obj); 945ffd83dbSDimitry Andric return i.AsUnsignedLongLong(); 955ffd83dbSDimitry Andric } 965ffd83dbSDimitry Andric #endif 975ffd83dbSDimitry Andric assert(!PyErr_Occurred()); 985ffd83dbSDimitry Andric long long r = PyLong_AsUnsignedLongLong(m_py_obj); 995ffd83dbSDimitry Andric if (PyErr_Occurred()) 1005ffd83dbSDimitry Andric return exception(); 1015ffd83dbSDimitry Andric return r; 1025ffd83dbSDimitry Andric } 1035ffd83dbSDimitry Andric 1045ffd83dbSDimitry Andric // wraps on overflow, instead of raising an error. 1055ffd83dbSDimitry Andric Expected<unsigned long long> PythonObject::AsModuloUnsignedLongLong() const { 1065ffd83dbSDimitry Andric if (!m_py_obj) 1075ffd83dbSDimitry Andric return nullDeref(); 1085ffd83dbSDimitry Andric #if PY_MAJOR_VERSION < 3 1095ffd83dbSDimitry Andric if (!PyLong_Check(m_py_obj)) { 1105ffd83dbSDimitry Andric PythonInteger i(PyRefType::Borrowed, m_py_obj); 1115ffd83dbSDimitry Andric return i.AsModuloUnsignedLongLong(); 1125ffd83dbSDimitry Andric } 1135ffd83dbSDimitry Andric #endif 1145ffd83dbSDimitry Andric assert(!PyErr_Occurred()); 1155ffd83dbSDimitry Andric unsigned long long r = PyLong_AsUnsignedLongLongMask(m_py_obj); 1165ffd83dbSDimitry Andric if (PyErr_Occurred()) 1175ffd83dbSDimitry Andric return exception(); 1185ffd83dbSDimitry Andric return r; 1199dba64beSDimitry Andric } 1209dba64beSDimitry Andric 1219dba64beSDimitry Andric void StructuredPythonObject::Serialize(llvm::json::OStream &s) const { 1229dba64beSDimitry Andric s.value(llvm::formatv("Python Obj: {0:X}", GetValue()).str()); 123*0b57cec5SDimitry Andric } 124*0b57cec5SDimitry Andric 125*0b57cec5SDimitry Andric // PythonObject 126*0b57cec5SDimitry Andric 127*0b57cec5SDimitry Andric void PythonObject::Dump(Stream &strm) const { 128*0b57cec5SDimitry Andric if (m_py_obj) { 129*0b57cec5SDimitry Andric FILE *file = llvm::sys::RetryAfterSignal(nullptr, ::tmpfile); 130*0b57cec5SDimitry Andric if (file) { 131*0b57cec5SDimitry Andric ::PyObject_Print(m_py_obj, file, 0); 132*0b57cec5SDimitry Andric const long length = ftell(file); 133*0b57cec5SDimitry Andric if (length) { 134*0b57cec5SDimitry Andric ::rewind(file); 135*0b57cec5SDimitry Andric std::vector<char> file_contents(length, '\0'); 136*0b57cec5SDimitry Andric const size_t length_read = 137*0b57cec5SDimitry Andric ::fread(file_contents.data(), 1, file_contents.size(), file); 138*0b57cec5SDimitry Andric if (length_read > 0) 139*0b57cec5SDimitry Andric strm.Write(file_contents.data(), length_read); 140*0b57cec5SDimitry Andric } 141*0b57cec5SDimitry Andric ::fclose(file); 142*0b57cec5SDimitry Andric } 143*0b57cec5SDimitry Andric } else 144*0b57cec5SDimitry Andric strm.PutCString("NULL"); 145*0b57cec5SDimitry Andric } 146*0b57cec5SDimitry Andric 147*0b57cec5SDimitry Andric PyObjectType PythonObject::GetObjectType() const { 148*0b57cec5SDimitry Andric if (!IsAllocated()) 149*0b57cec5SDimitry Andric return PyObjectType::None; 150*0b57cec5SDimitry Andric 151*0b57cec5SDimitry Andric if (PythonModule::Check(m_py_obj)) 152*0b57cec5SDimitry Andric return PyObjectType::Module; 153*0b57cec5SDimitry Andric if (PythonList::Check(m_py_obj)) 154*0b57cec5SDimitry Andric return PyObjectType::List; 155*0b57cec5SDimitry Andric if (PythonTuple::Check(m_py_obj)) 156*0b57cec5SDimitry Andric return PyObjectType::Tuple; 157*0b57cec5SDimitry Andric if (PythonDictionary::Check(m_py_obj)) 158*0b57cec5SDimitry Andric return PyObjectType::Dictionary; 159*0b57cec5SDimitry Andric if (PythonString::Check(m_py_obj)) 160*0b57cec5SDimitry Andric return PyObjectType::String; 161*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 162*0b57cec5SDimitry Andric if (PythonBytes::Check(m_py_obj)) 163*0b57cec5SDimitry Andric return PyObjectType::Bytes; 164*0b57cec5SDimitry Andric #endif 165*0b57cec5SDimitry Andric if (PythonByteArray::Check(m_py_obj)) 166*0b57cec5SDimitry Andric return PyObjectType::ByteArray; 167*0b57cec5SDimitry Andric if (PythonBoolean::Check(m_py_obj)) 168*0b57cec5SDimitry Andric return PyObjectType::Boolean; 169*0b57cec5SDimitry Andric if (PythonInteger::Check(m_py_obj)) 170*0b57cec5SDimitry Andric return PyObjectType::Integer; 171*0b57cec5SDimitry Andric if (PythonFile::Check(m_py_obj)) 172*0b57cec5SDimitry Andric return PyObjectType::File; 173*0b57cec5SDimitry Andric if (PythonCallable::Check(m_py_obj)) 174*0b57cec5SDimitry Andric return PyObjectType::Callable; 175*0b57cec5SDimitry Andric return PyObjectType::Unknown; 176*0b57cec5SDimitry Andric } 177*0b57cec5SDimitry Andric 178*0b57cec5SDimitry Andric PythonString PythonObject::Repr() const { 179*0b57cec5SDimitry Andric if (!m_py_obj) 180*0b57cec5SDimitry Andric return PythonString(); 181*0b57cec5SDimitry Andric PyObject *repr = PyObject_Repr(m_py_obj); 182*0b57cec5SDimitry Andric if (!repr) 183*0b57cec5SDimitry Andric return PythonString(); 184*0b57cec5SDimitry Andric return PythonString(PyRefType::Owned, repr); 185*0b57cec5SDimitry Andric } 186*0b57cec5SDimitry Andric 187*0b57cec5SDimitry Andric PythonString PythonObject::Str() const { 188*0b57cec5SDimitry Andric if (!m_py_obj) 189*0b57cec5SDimitry Andric return PythonString(); 190*0b57cec5SDimitry Andric PyObject *str = PyObject_Str(m_py_obj); 191*0b57cec5SDimitry Andric if (!str) 192*0b57cec5SDimitry Andric return PythonString(); 193*0b57cec5SDimitry Andric return PythonString(PyRefType::Owned, str); 194*0b57cec5SDimitry Andric } 195*0b57cec5SDimitry Andric 196*0b57cec5SDimitry Andric PythonObject 197*0b57cec5SDimitry Andric PythonObject::ResolveNameWithDictionary(llvm::StringRef name, 198*0b57cec5SDimitry Andric const PythonDictionary &dict) { 199*0b57cec5SDimitry Andric size_t dot_pos = name.find('.'); 200*0b57cec5SDimitry Andric llvm::StringRef piece = name.substr(0, dot_pos); 201*0b57cec5SDimitry Andric PythonObject result = dict.GetItemForKey(PythonString(piece)); 202*0b57cec5SDimitry Andric if (dot_pos == llvm::StringRef::npos) { 203*0b57cec5SDimitry Andric // There was no dot, we're done. 204*0b57cec5SDimitry Andric return result; 205*0b57cec5SDimitry Andric } 206*0b57cec5SDimitry Andric 207*0b57cec5SDimitry Andric // There was a dot. The remaining portion of the name should be looked up in 208*0b57cec5SDimitry Andric // the context of the object that was found in the dictionary. 209*0b57cec5SDimitry Andric return result.ResolveName(name.substr(dot_pos + 1)); 210*0b57cec5SDimitry Andric } 211*0b57cec5SDimitry Andric 212*0b57cec5SDimitry Andric PythonObject PythonObject::ResolveName(llvm::StringRef name) const { 213*0b57cec5SDimitry Andric // Resolve the name in the context of the specified object. If, for example, 214*0b57cec5SDimitry Andric // `this` refers to a PyModule, then this will look for `name` in this 215*0b57cec5SDimitry Andric // module. If `this` refers to a PyType, then it will resolve `name` as an 216*0b57cec5SDimitry Andric // attribute of that type. If `this` refers to an instance of an object, 217*0b57cec5SDimitry Andric // then it will resolve `name` as the value of the specified field. 218*0b57cec5SDimitry Andric // 219*0b57cec5SDimitry Andric // This function handles dotted names so that, for example, if `m_py_obj` 220*0b57cec5SDimitry Andric // refers to the `sys` module, and `name` == "path.append", then it will find 221*0b57cec5SDimitry Andric // the function `sys.path.append`. 222*0b57cec5SDimitry Andric 223*0b57cec5SDimitry Andric size_t dot_pos = name.find('.'); 224*0b57cec5SDimitry Andric if (dot_pos == llvm::StringRef::npos) { 225*0b57cec5SDimitry Andric // No dots in the name, we should be able to find the value immediately as 226*0b57cec5SDimitry Andric // an attribute of `m_py_obj`. 227*0b57cec5SDimitry Andric return GetAttributeValue(name); 228*0b57cec5SDimitry Andric } 229*0b57cec5SDimitry Andric 230*0b57cec5SDimitry Andric // Look up the first piece of the name, and resolve the rest as a child of 231*0b57cec5SDimitry Andric // that. 232*0b57cec5SDimitry Andric PythonObject parent = ResolveName(name.substr(0, dot_pos)); 233*0b57cec5SDimitry Andric if (!parent.IsAllocated()) 234*0b57cec5SDimitry Andric return PythonObject(); 235*0b57cec5SDimitry Andric 236*0b57cec5SDimitry Andric // Tail recursion.. should be optimized by the compiler 237*0b57cec5SDimitry Andric return parent.ResolveName(name.substr(dot_pos + 1)); 238*0b57cec5SDimitry Andric } 239*0b57cec5SDimitry Andric 240*0b57cec5SDimitry Andric bool PythonObject::HasAttribute(llvm::StringRef attr) const { 241*0b57cec5SDimitry Andric if (!IsValid()) 242*0b57cec5SDimitry Andric return false; 243*0b57cec5SDimitry Andric PythonString py_attr(attr); 244*0b57cec5SDimitry Andric return !!PyObject_HasAttr(m_py_obj, py_attr.get()); 245*0b57cec5SDimitry Andric } 246*0b57cec5SDimitry Andric 247*0b57cec5SDimitry Andric PythonObject PythonObject::GetAttributeValue(llvm::StringRef attr) const { 248*0b57cec5SDimitry Andric if (!IsValid()) 249*0b57cec5SDimitry Andric return PythonObject(); 250*0b57cec5SDimitry Andric 251*0b57cec5SDimitry Andric PythonString py_attr(attr); 252*0b57cec5SDimitry Andric if (!PyObject_HasAttr(m_py_obj, py_attr.get())) 253*0b57cec5SDimitry Andric return PythonObject(); 254*0b57cec5SDimitry Andric 255*0b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, 256*0b57cec5SDimitry Andric PyObject_GetAttr(m_py_obj, py_attr.get())); 257*0b57cec5SDimitry Andric } 258*0b57cec5SDimitry Andric 259*0b57cec5SDimitry Andric StructuredData::ObjectSP PythonObject::CreateStructuredObject() const { 260*0b57cec5SDimitry Andric switch (GetObjectType()) { 261*0b57cec5SDimitry Andric case PyObjectType::Dictionary: 262*0b57cec5SDimitry Andric return PythonDictionary(PyRefType::Borrowed, m_py_obj) 263*0b57cec5SDimitry Andric .CreateStructuredDictionary(); 264*0b57cec5SDimitry Andric case PyObjectType::Boolean: 265*0b57cec5SDimitry Andric return PythonBoolean(PyRefType::Borrowed, m_py_obj) 266*0b57cec5SDimitry Andric .CreateStructuredBoolean(); 267*0b57cec5SDimitry Andric case PyObjectType::Integer: 268*0b57cec5SDimitry Andric return PythonInteger(PyRefType::Borrowed, m_py_obj) 269*0b57cec5SDimitry Andric .CreateStructuredInteger(); 270*0b57cec5SDimitry Andric case PyObjectType::List: 271*0b57cec5SDimitry Andric return PythonList(PyRefType::Borrowed, m_py_obj).CreateStructuredArray(); 272*0b57cec5SDimitry Andric case PyObjectType::String: 273*0b57cec5SDimitry Andric return PythonString(PyRefType::Borrowed, m_py_obj).CreateStructuredString(); 274*0b57cec5SDimitry Andric case PyObjectType::Bytes: 275*0b57cec5SDimitry Andric return PythonBytes(PyRefType::Borrowed, m_py_obj).CreateStructuredString(); 276*0b57cec5SDimitry Andric case PyObjectType::ByteArray: 277*0b57cec5SDimitry Andric return PythonByteArray(PyRefType::Borrowed, m_py_obj) 278*0b57cec5SDimitry Andric .CreateStructuredString(); 279*0b57cec5SDimitry Andric case PyObjectType::None: 280*0b57cec5SDimitry Andric return StructuredData::ObjectSP(); 281*0b57cec5SDimitry Andric default: 282*0b57cec5SDimitry Andric return StructuredData::ObjectSP(new StructuredPythonObject(m_py_obj)); 283*0b57cec5SDimitry Andric } 284*0b57cec5SDimitry Andric } 285*0b57cec5SDimitry Andric 286*0b57cec5SDimitry Andric // PythonString 287*0b57cec5SDimitry Andric 2889dba64beSDimitry Andric PythonBytes::PythonBytes(llvm::ArrayRef<uint8_t> bytes) { SetBytes(bytes); } 289*0b57cec5SDimitry Andric 2909dba64beSDimitry Andric PythonBytes::PythonBytes(const uint8_t *bytes, size_t length) { 291*0b57cec5SDimitry Andric SetBytes(llvm::ArrayRef<uint8_t>(bytes, length)); 292*0b57cec5SDimitry Andric } 293*0b57cec5SDimitry Andric 294*0b57cec5SDimitry Andric bool PythonBytes::Check(PyObject *py_obj) { 295*0b57cec5SDimitry Andric if (!py_obj) 296*0b57cec5SDimitry Andric return false; 297*0b57cec5SDimitry Andric return PyBytes_Check(py_obj); 298*0b57cec5SDimitry Andric } 299*0b57cec5SDimitry Andric 300*0b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> PythonBytes::GetBytes() const { 301*0b57cec5SDimitry Andric if (!IsValid()) 302*0b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(); 303*0b57cec5SDimitry Andric 304*0b57cec5SDimitry Andric Py_ssize_t size; 305*0b57cec5SDimitry Andric char *c; 306*0b57cec5SDimitry Andric 307*0b57cec5SDimitry Andric PyBytes_AsStringAndSize(m_py_obj, &c, &size); 308*0b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(reinterpret_cast<uint8_t *>(c), size); 309*0b57cec5SDimitry Andric } 310*0b57cec5SDimitry Andric 311*0b57cec5SDimitry Andric size_t PythonBytes::GetSize() const { 312*0b57cec5SDimitry Andric if (!IsValid()) 313*0b57cec5SDimitry Andric return 0; 314*0b57cec5SDimitry Andric return PyBytes_Size(m_py_obj); 315*0b57cec5SDimitry Andric } 316*0b57cec5SDimitry Andric 317*0b57cec5SDimitry Andric void PythonBytes::SetBytes(llvm::ArrayRef<uint8_t> bytes) { 318*0b57cec5SDimitry Andric const char *data = reinterpret_cast<const char *>(bytes.data()); 3199dba64beSDimitry Andric *this = Take<PythonBytes>(PyBytes_FromStringAndSize(data, bytes.size())); 320*0b57cec5SDimitry Andric } 321*0b57cec5SDimitry Andric 322*0b57cec5SDimitry Andric StructuredData::StringSP PythonBytes::CreateStructuredString() const { 323*0b57cec5SDimitry Andric StructuredData::StringSP result(new StructuredData::String); 324*0b57cec5SDimitry Andric Py_ssize_t size; 325*0b57cec5SDimitry Andric char *c; 326*0b57cec5SDimitry Andric PyBytes_AsStringAndSize(m_py_obj, &c, &size); 327*0b57cec5SDimitry Andric result->SetValue(std::string(c, size)); 328*0b57cec5SDimitry Andric return result; 329*0b57cec5SDimitry Andric } 330*0b57cec5SDimitry Andric 331*0b57cec5SDimitry Andric PythonByteArray::PythonByteArray(llvm::ArrayRef<uint8_t> bytes) 332*0b57cec5SDimitry Andric : PythonByteArray(bytes.data(), bytes.size()) {} 333*0b57cec5SDimitry Andric 334*0b57cec5SDimitry Andric PythonByteArray::PythonByteArray(const uint8_t *bytes, size_t length) { 335*0b57cec5SDimitry Andric const char *str = reinterpret_cast<const char *>(bytes); 3369dba64beSDimitry Andric *this = Take<PythonByteArray>(PyByteArray_FromStringAndSize(str, length)); 337*0b57cec5SDimitry Andric } 338*0b57cec5SDimitry Andric 339*0b57cec5SDimitry Andric bool PythonByteArray::Check(PyObject *py_obj) { 340*0b57cec5SDimitry Andric if (!py_obj) 341*0b57cec5SDimitry Andric return false; 342*0b57cec5SDimitry Andric return PyByteArray_Check(py_obj); 343*0b57cec5SDimitry Andric } 344*0b57cec5SDimitry Andric 345*0b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> PythonByteArray::GetBytes() const { 346*0b57cec5SDimitry Andric if (!IsValid()) 347*0b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(); 348*0b57cec5SDimitry Andric 349*0b57cec5SDimitry Andric char *c = PyByteArray_AsString(m_py_obj); 350*0b57cec5SDimitry Andric size_t size = GetSize(); 351*0b57cec5SDimitry Andric return llvm::ArrayRef<uint8_t>(reinterpret_cast<uint8_t *>(c), size); 352*0b57cec5SDimitry Andric } 353*0b57cec5SDimitry Andric 354*0b57cec5SDimitry Andric size_t PythonByteArray::GetSize() const { 355*0b57cec5SDimitry Andric if (!IsValid()) 356*0b57cec5SDimitry Andric return 0; 357*0b57cec5SDimitry Andric 358*0b57cec5SDimitry Andric return PyByteArray_Size(m_py_obj); 359*0b57cec5SDimitry Andric } 360*0b57cec5SDimitry Andric 361*0b57cec5SDimitry Andric StructuredData::StringSP PythonByteArray::CreateStructuredString() const { 362*0b57cec5SDimitry Andric StructuredData::StringSP result(new StructuredData::String); 363*0b57cec5SDimitry Andric llvm::ArrayRef<uint8_t> bytes = GetBytes(); 364*0b57cec5SDimitry Andric const char *str = reinterpret_cast<const char *>(bytes.data()); 365*0b57cec5SDimitry Andric result->SetValue(std::string(str, bytes.size())); 366*0b57cec5SDimitry Andric return result; 367*0b57cec5SDimitry Andric } 368*0b57cec5SDimitry Andric 369*0b57cec5SDimitry Andric // PythonString 370*0b57cec5SDimitry Andric 3719dba64beSDimitry Andric Expected<PythonString> PythonString::FromUTF8(llvm::StringRef string) { 3729dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 3739dba64beSDimitry Andric PyObject *str = PyUnicode_FromStringAndSize(string.data(), string.size()); 3749dba64beSDimitry Andric #else 3759dba64beSDimitry Andric PyObject *str = PyString_FromStringAndSize(string.data(), string.size()); 3769dba64beSDimitry Andric #endif 3779dba64beSDimitry Andric if (!str) 3789dba64beSDimitry Andric return llvm::make_error<PythonException>(); 3799dba64beSDimitry Andric return Take<PythonString>(str); 380*0b57cec5SDimitry Andric } 381*0b57cec5SDimitry Andric 3829dba64beSDimitry Andric PythonString::PythonString(llvm::StringRef string) { SetString(string); } 383*0b57cec5SDimitry Andric 384*0b57cec5SDimitry Andric bool PythonString::Check(PyObject *py_obj) { 385*0b57cec5SDimitry Andric if (!py_obj) 386*0b57cec5SDimitry Andric return false; 387*0b57cec5SDimitry Andric 388*0b57cec5SDimitry Andric if (PyUnicode_Check(py_obj)) 389*0b57cec5SDimitry Andric return true; 390*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 391*0b57cec5SDimitry Andric if (PyString_Check(py_obj)) 392*0b57cec5SDimitry Andric return true; 393*0b57cec5SDimitry Andric #endif 394*0b57cec5SDimitry Andric return false; 395*0b57cec5SDimitry Andric } 396*0b57cec5SDimitry Andric 3979dba64beSDimitry Andric void PythonString::Convert(PyRefType &type, PyObject *&py_obj) { 398*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 399*0b57cec5SDimitry Andric // In Python 2, Don't store PyUnicode objects directly, because we need 400*0b57cec5SDimitry Andric // access to their underlying character buffers which Python 2 doesn't 401*0b57cec5SDimitry Andric // provide. 4029dba64beSDimitry Andric if (PyUnicode_Check(py_obj)) { 4039dba64beSDimitry Andric PyObject *s = PyUnicode_AsUTF8String(py_obj); 4049dba64beSDimitry Andric if (s == nullptr) { 4059dba64beSDimitry Andric PyErr_Clear(); 4069dba64beSDimitry Andric if (type == PyRefType::Owned) 4079dba64beSDimitry Andric Py_DECREF(py_obj); 4089dba64beSDimitry Andric return; 4099dba64beSDimitry Andric } 4109dba64beSDimitry Andric if (type == PyRefType::Owned) 4119dba64beSDimitry Andric Py_DECREF(py_obj); 4129dba64beSDimitry Andric else 4139dba64beSDimitry Andric type = PyRefType::Owned; 4149dba64beSDimitry Andric py_obj = s; 4159dba64beSDimitry Andric } 416*0b57cec5SDimitry Andric #endif 417*0b57cec5SDimitry Andric } 418*0b57cec5SDimitry Andric 419*0b57cec5SDimitry Andric llvm::StringRef PythonString::GetString() const { 4209dba64beSDimitry Andric auto s = AsUTF8(); 4219dba64beSDimitry Andric if (!s) { 4229dba64beSDimitry Andric llvm::consumeError(s.takeError()); 4239dba64beSDimitry Andric return llvm::StringRef(""); 4249dba64beSDimitry Andric } 4259dba64beSDimitry Andric return s.get(); 4269dba64beSDimitry Andric } 4279dba64beSDimitry Andric 4289dba64beSDimitry Andric Expected<llvm::StringRef> PythonString::AsUTF8() const { 429*0b57cec5SDimitry Andric if (!IsValid()) 4309dba64beSDimitry Andric return nullDeref(); 431*0b57cec5SDimitry Andric 432*0b57cec5SDimitry Andric Py_ssize_t size; 433*0b57cec5SDimitry Andric const char *data; 434*0b57cec5SDimitry Andric 435*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 436*0b57cec5SDimitry Andric data = PyUnicode_AsUTF8AndSize(m_py_obj, &size); 437*0b57cec5SDimitry Andric #else 4389dba64beSDimitry Andric char *c = NULL; 4399dba64beSDimitry Andric int r = PyString_AsStringAndSize(m_py_obj, &c, &size); 4409dba64beSDimitry Andric if (r < 0) 4419dba64beSDimitry Andric c = NULL; 442*0b57cec5SDimitry Andric data = c; 443*0b57cec5SDimitry Andric #endif 4449dba64beSDimitry Andric 4459dba64beSDimitry Andric if (!data) 4469dba64beSDimitry Andric return exception(); 4479dba64beSDimitry Andric 448*0b57cec5SDimitry Andric return llvm::StringRef(data, size); 449*0b57cec5SDimitry Andric } 450*0b57cec5SDimitry Andric 451*0b57cec5SDimitry Andric size_t PythonString::GetSize() const { 452*0b57cec5SDimitry Andric if (IsValid()) { 453*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 454e8d8bef9SDimitry Andric #if PY_MINOR_VERSION >= 3 455e8d8bef9SDimitry Andric return PyUnicode_GetLength(m_py_obj); 456e8d8bef9SDimitry Andric #else 457*0b57cec5SDimitry Andric return PyUnicode_GetSize(m_py_obj); 458e8d8bef9SDimitry Andric #endif 459*0b57cec5SDimitry Andric #else 460*0b57cec5SDimitry Andric return PyString_Size(m_py_obj); 461*0b57cec5SDimitry Andric #endif 462*0b57cec5SDimitry Andric } 463*0b57cec5SDimitry Andric return 0; 464*0b57cec5SDimitry Andric } 465*0b57cec5SDimitry Andric 466*0b57cec5SDimitry Andric void PythonString::SetString(llvm::StringRef string) { 4679dba64beSDimitry Andric auto s = FromUTF8(string); 4689dba64beSDimitry Andric if (!s) { 4699dba64beSDimitry Andric llvm::consumeError(s.takeError()); 4709dba64beSDimitry Andric Reset(); 4719dba64beSDimitry Andric } else { 4729dba64beSDimitry Andric *this = std::move(s.get()); 4739dba64beSDimitry Andric } 474*0b57cec5SDimitry Andric } 475*0b57cec5SDimitry Andric 476*0b57cec5SDimitry Andric StructuredData::StringSP PythonString::CreateStructuredString() const { 477*0b57cec5SDimitry Andric StructuredData::StringSP result(new StructuredData::String); 478*0b57cec5SDimitry Andric result->SetValue(GetString()); 479*0b57cec5SDimitry Andric return result; 480*0b57cec5SDimitry Andric } 481*0b57cec5SDimitry Andric 482*0b57cec5SDimitry Andric // PythonInteger 483*0b57cec5SDimitry Andric 4849dba64beSDimitry Andric PythonInteger::PythonInteger(int64_t value) { SetInteger(value); } 485*0b57cec5SDimitry Andric 486*0b57cec5SDimitry Andric bool PythonInteger::Check(PyObject *py_obj) { 487*0b57cec5SDimitry Andric if (!py_obj) 488*0b57cec5SDimitry Andric return false; 489*0b57cec5SDimitry Andric 490*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 491*0b57cec5SDimitry Andric // Python 3 does not have PyInt_Check. There is only one type of integral 492*0b57cec5SDimitry Andric // value, long. 493*0b57cec5SDimitry Andric return PyLong_Check(py_obj); 494*0b57cec5SDimitry Andric #else 495*0b57cec5SDimitry Andric return PyLong_Check(py_obj) || PyInt_Check(py_obj); 496*0b57cec5SDimitry Andric #endif 497*0b57cec5SDimitry Andric } 498*0b57cec5SDimitry Andric 4999dba64beSDimitry Andric void PythonInteger::Convert(PyRefType &type, PyObject *&py_obj) { 500*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 501*0b57cec5SDimitry Andric // Always store this as a PyLong, which makes interoperability between Python 502*0b57cec5SDimitry Andric // 2.x and Python 3.x easier. This is only necessary in 2.x, since 3.x 503*0b57cec5SDimitry Andric // doesn't even have a PyInt. 504*0b57cec5SDimitry Andric if (PyInt_Check(py_obj)) { 505*0b57cec5SDimitry Andric // Since we converted the original object to a different type, the new 506*0b57cec5SDimitry Andric // object is an owned object regardless of the ownership semantics 507*0b57cec5SDimitry Andric // requested by the user. 5089dba64beSDimitry Andric long long value = PyInt_AsLong(py_obj); 5099dba64beSDimitry Andric PyObject *l = nullptr; 5109dba64beSDimitry Andric if (!PyErr_Occurred()) 5119dba64beSDimitry Andric l = PyLong_FromLongLong(value); 5129dba64beSDimitry Andric if (l == nullptr) { 5139dba64beSDimitry Andric PyErr_Clear(); 5149dba64beSDimitry Andric if (type == PyRefType::Owned) 5159dba64beSDimitry Andric Py_DECREF(py_obj); 5169dba64beSDimitry Andric return; 5179dba64beSDimitry Andric } 5189dba64beSDimitry Andric if (type == PyRefType::Owned) 5199dba64beSDimitry Andric Py_DECREF(py_obj); 5209dba64beSDimitry Andric else 5219dba64beSDimitry Andric type = PyRefType::Owned; 5229dba64beSDimitry Andric py_obj = l; 523*0b57cec5SDimitry Andric } 524*0b57cec5SDimitry Andric #endif 525*0b57cec5SDimitry Andric } 526*0b57cec5SDimitry Andric 527*0b57cec5SDimitry Andric void PythonInteger::SetInteger(int64_t value) { 5289dba64beSDimitry Andric *this = Take<PythonInteger>(PyLong_FromLongLong(value)); 529*0b57cec5SDimitry Andric } 530*0b57cec5SDimitry Andric 531*0b57cec5SDimitry Andric StructuredData::IntegerSP PythonInteger::CreateStructuredInteger() const { 532*0b57cec5SDimitry Andric StructuredData::IntegerSP result(new StructuredData::Integer); 5335ffd83dbSDimitry Andric // FIXME this is really not ideal. Errors are silently converted to 0 5345ffd83dbSDimitry Andric // and overflows are silently wrapped. But we'd need larger changes 5355ffd83dbSDimitry Andric // to StructuredData to fix it, so that's how it is for now. 5365ffd83dbSDimitry Andric llvm::Expected<unsigned long long> value = AsModuloUnsignedLongLong(); 5375ffd83dbSDimitry Andric if (!value) { 5385ffd83dbSDimitry Andric llvm::consumeError(value.takeError()); 5395ffd83dbSDimitry Andric result->SetValue(0); 5405ffd83dbSDimitry Andric } else { 5415ffd83dbSDimitry Andric result->SetValue(value.get()); 5425ffd83dbSDimitry Andric } 543*0b57cec5SDimitry Andric return result; 544*0b57cec5SDimitry Andric } 545*0b57cec5SDimitry Andric 546*0b57cec5SDimitry Andric // PythonBoolean 547*0b57cec5SDimitry Andric 548*0b57cec5SDimitry Andric PythonBoolean::PythonBoolean(bool value) { 549*0b57cec5SDimitry Andric SetValue(value); 550*0b57cec5SDimitry Andric } 551*0b57cec5SDimitry Andric 552*0b57cec5SDimitry Andric bool PythonBoolean::Check(PyObject *py_obj) { 553*0b57cec5SDimitry Andric return py_obj ? PyBool_Check(py_obj) : false; 554*0b57cec5SDimitry Andric } 555*0b57cec5SDimitry Andric 556*0b57cec5SDimitry Andric bool PythonBoolean::GetValue() const { 557*0b57cec5SDimitry Andric return m_py_obj ? PyObject_IsTrue(m_py_obj) : false; 558*0b57cec5SDimitry Andric } 559*0b57cec5SDimitry Andric 560*0b57cec5SDimitry Andric void PythonBoolean::SetValue(bool value) { 5619dba64beSDimitry Andric *this = Take<PythonBoolean>(PyBool_FromLong(value)); 562*0b57cec5SDimitry Andric } 563*0b57cec5SDimitry Andric 564*0b57cec5SDimitry Andric StructuredData::BooleanSP PythonBoolean::CreateStructuredBoolean() const { 565*0b57cec5SDimitry Andric StructuredData::BooleanSP result(new StructuredData::Boolean); 566*0b57cec5SDimitry Andric result->SetValue(GetValue()); 567*0b57cec5SDimitry Andric return result; 568*0b57cec5SDimitry Andric } 569*0b57cec5SDimitry Andric 570*0b57cec5SDimitry Andric // PythonList 571*0b57cec5SDimitry Andric 5729dba64beSDimitry Andric PythonList::PythonList(PyInitialValue value) { 573*0b57cec5SDimitry Andric if (value == PyInitialValue::Empty) 5749dba64beSDimitry Andric *this = Take<PythonList>(PyList_New(0)); 575*0b57cec5SDimitry Andric } 576*0b57cec5SDimitry Andric 5779dba64beSDimitry Andric PythonList::PythonList(int list_size) { 5789dba64beSDimitry Andric *this = Take<PythonList>(PyList_New(list_size)); 579*0b57cec5SDimitry Andric } 580*0b57cec5SDimitry Andric 581*0b57cec5SDimitry Andric bool PythonList::Check(PyObject *py_obj) { 582*0b57cec5SDimitry Andric if (!py_obj) 583*0b57cec5SDimitry Andric return false; 584*0b57cec5SDimitry Andric return PyList_Check(py_obj); 585*0b57cec5SDimitry Andric } 586*0b57cec5SDimitry Andric 587*0b57cec5SDimitry Andric uint32_t PythonList::GetSize() const { 588*0b57cec5SDimitry Andric if (IsValid()) 589*0b57cec5SDimitry Andric return PyList_GET_SIZE(m_py_obj); 590*0b57cec5SDimitry Andric return 0; 591*0b57cec5SDimitry Andric } 592*0b57cec5SDimitry Andric 593*0b57cec5SDimitry Andric PythonObject PythonList::GetItemAtIndex(uint32_t index) const { 594*0b57cec5SDimitry Andric if (IsValid()) 595*0b57cec5SDimitry Andric return PythonObject(PyRefType::Borrowed, PyList_GetItem(m_py_obj, index)); 596*0b57cec5SDimitry Andric return PythonObject(); 597*0b57cec5SDimitry Andric } 598*0b57cec5SDimitry Andric 599*0b57cec5SDimitry Andric void PythonList::SetItemAtIndex(uint32_t index, const PythonObject &object) { 600*0b57cec5SDimitry Andric if (IsAllocated() && object.IsValid()) { 601*0b57cec5SDimitry Andric // PyList_SetItem is documented to "steal" a reference, so we need to 602*0b57cec5SDimitry Andric // convert it to an owned reference by incrementing it. 603*0b57cec5SDimitry Andric Py_INCREF(object.get()); 604*0b57cec5SDimitry Andric PyList_SetItem(m_py_obj, index, object.get()); 605*0b57cec5SDimitry Andric } 606*0b57cec5SDimitry Andric } 607*0b57cec5SDimitry Andric 608*0b57cec5SDimitry Andric void PythonList::AppendItem(const PythonObject &object) { 609*0b57cec5SDimitry Andric if (IsAllocated() && object.IsValid()) { 610*0b57cec5SDimitry Andric // `PyList_Append` does *not* steal a reference, so do not call `Py_INCREF` 611*0b57cec5SDimitry Andric // here like we do with `PyList_SetItem`. 612*0b57cec5SDimitry Andric PyList_Append(m_py_obj, object.get()); 613*0b57cec5SDimitry Andric } 614*0b57cec5SDimitry Andric } 615*0b57cec5SDimitry Andric 616*0b57cec5SDimitry Andric StructuredData::ArraySP PythonList::CreateStructuredArray() const { 617*0b57cec5SDimitry Andric StructuredData::ArraySP result(new StructuredData::Array); 618*0b57cec5SDimitry Andric uint32_t count = GetSize(); 619*0b57cec5SDimitry Andric for (uint32_t i = 0; i < count; ++i) { 620*0b57cec5SDimitry Andric PythonObject obj = GetItemAtIndex(i); 621*0b57cec5SDimitry Andric result->AddItem(obj.CreateStructuredObject()); 622*0b57cec5SDimitry Andric } 623*0b57cec5SDimitry Andric return result; 624*0b57cec5SDimitry Andric } 625*0b57cec5SDimitry Andric 626*0b57cec5SDimitry Andric // PythonTuple 627*0b57cec5SDimitry Andric 6289dba64beSDimitry Andric PythonTuple::PythonTuple(PyInitialValue value) { 629*0b57cec5SDimitry Andric if (value == PyInitialValue::Empty) 6309dba64beSDimitry Andric *this = Take<PythonTuple>(PyTuple_New(0)); 631*0b57cec5SDimitry Andric } 632*0b57cec5SDimitry Andric 6339dba64beSDimitry Andric PythonTuple::PythonTuple(int tuple_size) { 6349dba64beSDimitry Andric *this = Take<PythonTuple>(PyTuple_New(tuple_size)); 635*0b57cec5SDimitry Andric } 636*0b57cec5SDimitry Andric 637*0b57cec5SDimitry Andric PythonTuple::PythonTuple(std::initializer_list<PythonObject> objects) { 638*0b57cec5SDimitry Andric m_py_obj = PyTuple_New(objects.size()); 639*0b57cec5SDimitry Andric 640*0b57cec5SDimitry Andric uint32_t idx = 0; 641*0b57cec5SDimitry Andric for (auto object : objects) { 642*0b57cec5SDimitry Andric if (object.IsValid()) 643*0b57cec5SDimitry Andric SetItemAtIndex(idx, object); 644*0b57cec5SDimitry Andric idx++; 645*0b57cec5SDimitry Andric } 646*0b57cec5SDimitry Andric } 647*0b57cec5SDimitry Andric 648*0b57cec5SDimitry Andric PythonTuple::PythonTuple(std::initializer_list<PyObject *> objects) { 649*0b57cec5SDimitry Andric m_py_obj = PyTuple_New(objects.size()); 650*0b57cec5SDimitry Andric 651*0b57cec5SDimitry Andric uint32_t idx = 0; 652*0b57cec5SDimitry Andric for (auto py_object : objects) { 653*0b57cec5SDimitry Andric PythonObject object(PyRefType::Borrowed, py_object); 654*0b57cec5SDimitry Andric if (object.IsValid()) 655*0b57cec5SDimitry Andric SetItemAtIndex(idx, object); 656*0b57cec5SDimitry Andric idx++; 657*0b57cec5SDimitry Andric } 658*0b57cec5SDimitry Andric } 659*0b57cec5SDimitry Andric 660*0b57cec5SDimitry Andric bool PythonTuple::Check(PyObject *py_obj) { 661*0b57cec5SDimitry Andric if (!py_obj) 662*0b57cec5SDimitry Andric return false; 663*0b57cec5SDimitry Andric return PyTuple_Check(py_obj); 664*0b57cec5SDimitry Andric } 665*0b57cec5SDimitry Andric 666*0b57cec5SDimitry Andric uint32_t PythonTuple::GetSize() const { 667*0b57cec5SDimitry Andric if (IsValid()) 668*0b57cec5SDimitry Andric return PyTuple_GET_SIZE(m_py_obj); 669*0b57cec5SDimitry Andric return 0; 670*0b57cec5SDimitry Andric } 671*0b57cec5SDimitry Andric 672*0b57cec5SDimitry Andric PythonObject PythonTuple::GetItemAtIndex(uint32_t index) const { 673*0b57cec5SDimitry Andric if (IsValid()) 674*0b57cec5SDimitry Andric return PythonObject(PyRefType::Borrowed, PyTuple_GetItem(m_py_obj, index)); 675*0b57cec5SDimitry Andric return PythonObject(); 676*0b57cec5SDimitry Andric } 677*0b57cec5SDimitry Andric 678*0b57cec5SDimitry Andric void PythonTuple::SetItemAtIndex(uint32_t index, const PythonObject &object) { 679*0b57cec5SDimitry Andric if (IsAllocated() && object.IsValid()) { 680*0b57cec5SDimitry Andric // PyTuple_SetItem is documented to "steal" a reference, so we need to 681*0b57cec5SDimitry Andric // convert it to an owned reference by incrementing it. 682*0b57cec5SDimitry Andric Py_INCREF(object.get()); 683*0b57cec5SDimitry Andric PyTuple_SetItem(m_py_obj, index, object.get()); 684*0b57cec5SDimitry Andric } 685*0b57cec5SDimitry Andric } 686*0b57cec5SDimitry Andric 687*0b57cec5SDimitry Andric StructuredData::ArraySP PythonTuple::CreateStructuredArray() const { 688*0b57cec5SDimitry Andric StructuredData::ArraySP result(new StructuredData::Array); 689*0b57cec5SDimitry Andric uint32_t count = GetSize(); 690*0b57cec5SDimitry Andric for (uint32_t i = 0; i < count; ++i) { 691*0b57cec5SDimitry Andric PythonObject obj = GetItemAtIndex(i); 692*0b57cec5SDimitry Andric result->AddItem(obj.CreateStructuredObject()); 693*0b57cec5SDimitry Andric } 694*0b57cec5SDimitry Andric return result; 695*0b57cec5SDimitry Andric } 696*0b57cec5SDimitry Andric 697*0b57cec5SDimitry Andric // PythonDictionary 698*0b57cec5SDimitry Andric 6999dba64beSDimitry Andric PythonDictionary::PythonDictionary(PyInitialValue value) { 700*0b57cec5SDimitry Andric if (value == PyInitialValue::Empty) 7019dba64beSDimitry Andric *this = Take<PythonDictionary>(PyDict_New()); 702*0b57cec5SDimitry Andric } 703*0b57cec5SDimitry Andric 704*0b57cec5SDimitry Andric bool PythonDictionary::Check(PyObject *py_obj) { 705*0b57cec5SDimitry Andric if (!py_obj) 706*0b57cec5SDimitry Andric return false; 707*0b57cec5SDimitry Andric 708*0b57cec5SDimitry Andric return PyDict_Check(py_obj); 709*0b57cec5SDimitry Andric } 710*0b57cec5SDimitry Andric 711*0b57cec5SDimitry Andric uint32_t PythonDictionary::GetSize() const { 712*0b57cec5SDimitry Andric if (IsValid()) 713*0b57cec5SDimitry Andric return PyDict_Size(m_py_obj); 714*0b57cec5SDimitry Andric return 0; 715*0b57cec5SDimitry Andric } 716*0b57cec5SDimitry Andric 717*0b57cec5SDimitry Andric PythonList PythonDictionary::GetKeys() const { 718*0b57cec5SDimitry Andric if (IsValid()) 719*0b57cec5SDimitry Andric return PythonList(PyRefType::Owned, PyDict_Keys(m_py_obj)); 720*0b57cec5SDimitry Andric return PythonList(PyInitialValue::Invalid); 721*0b57cec5SDimitry Andric } 722*0b57cec5SDimitry Andric 723*0b57cec5SDimitry Andric PythonObject PythonDictionary::GetItemForKey(const PythonObject &key) const { 7249dba64beSDimitry Andric auto item = GetItem(key); 7259dba64beSDimitry Andric if (!item) { 7269dba64beSDimitry Andric llvm::consumeError(item.takeError()); 727*0b57cec5SDimitry Andric return PythonObject(); 728*0b57cec5SDimitry Andric } 7299dba64beSDimitry Andric return std::move(item.get()); 7309dba64beSDimitry Andric } 7319dba64beSDimitry Andric 7329dba64beSDimitry Andric Expected<PythonObject> 7339dba64beSDimitry Andric PythonDictionary::GetItem(const PythonObject &key) const { 7349dba64beSDimitry Andric if (!IsValid()) 7359dba64beSDimitry Andric return nullDeref(); 7369dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 7379dba64beSDimitry Andric PyObject *o = PyDict_GetItemWithError(m_py_obj, key.get()); 7389dba64beSDimitry Andric if (PyErr_Occurred()) 7399dba64beSDimitry Andric return exception(); 7409dba64beSDimitry Andric #else 7419dba64beSDimitry Andric PyObject *o = PyDict_GetItem(m_py_obj, key.get()); 7429dba64beSDimitry Andric #endif 7439dba64beSDimitry Andric if (!o) 7449dba64beSDimitry Andric return keyError(); 7459dba64beSDimitry Andric return Retain<PythonObject>(o); 7469dba64beSDimitry Andric } 7479dba64beSDimitry Andric 7489dba64beSDimitry Andric Expected<PythonObject> PythonDictionary::GetItem(const Twine &key) const { 7499dba64beSDimitry Andric if (!IsValid()) 7509dba64beSDimitry Andric return nullDeref(); 7519dba64beSDimitry Andric PyObject *o = PyDict_GetItemString(m_py_obj, NullTerminated(key)); 7529dba64beSDimitry Andric if (PyErr_Occurred()) 7539dba64beSDimitry Andric return exception(); 7549dba64beSDimitry Andric if (!o) 7559dba64beSDimitry Andric return keyError(); 7569dba64beSDimitry Andric return Retain<PythonObject>(o); 7579dba64beSDimitry Andric } 7589dba64beSDimitry Andric 7599dba64beSDimitry Andric Error PythonDictionary::SetItem(const PythonObject &key, 7609dba64beSDimitry Andric const PythonObject &value) const { 7619dba64beSDimitry Andric if (!IsValid() || !value.IsValid()) 7629dba64beSDimitry Andric return nullDeref(); 7639dba64beSDimitry Andric int r = PyDict_SetItem(m_py_obj, key.get(), value.get()); 7649dba64beSDimitry Andric if (r < 0) 7659dba64beSDimitry Andric return exception(); 7669dba64beSDimitry Andric return Error::success(); 7679dba64beSDimitry Andric } 7689dba64beSDimitry Andric 7699dba64beSDimitry Andric Error PythonDictionary::SetItem(const Twine &key, 7709dba64beSDimitry Andric const PythonObject &value) const { 7719dba64beSDimitry Andric if (!IsValid() || !value.IsValid()) 7729dba64beSDimitry Andric return nullDeref(); 7739dba64beSDimitry Andric int r = PyDict_SetItemString(m_py_obj, NullTerminated(key), value.get()); 7749dba64beSDimitry Andric if (r < 0) 7759dba64beSDimitry Andric return exception(); 7769dba64beSDimitry Andric return Error::success(); 7779dba64beSDimitry Andric } 778*0b57cec5SDimitry Andric 779*0b57cec5SDimitry Andric void PythonDictionary::SetItemForKey(const PythonObject &key, 780*0b57cec5SDimitry Andric const PythonObject &value) { 7819dba64beSDimitry Andric Error error = SetItem(key, value); 7829dba64beSDimitry Andric if (error) 7839dba64beSDimitry Andric llvm::consumeError(std::move(error)); 784*0b57cec5SDimitry Andric } 785*0b57cec5SDimitry Andric 786*0b57cec5SDimitry Andric StructuredData::DictionarySP 787*0b57cec5SDimitry Andric PythonDictionary::CreateStructuredDictionary() const { 788*0b57cec5SDimitry Andric StructuredData::DictionarySP result(new StructuredData::Dictionary); 789*0b57cec5SDimitry Andric PythonList keys(GetKeys()); 790*0b57cec5SDimitry Andric uint32_t num_keys = keys.GetSize(); 791*0b57cec5SDimitry Andric for (uint32_t i = 0; i < num_keys; ++i) { 792*0b57cec5SDimitry Andric PythonObject key = keys.GetItemAtIndex(i); 793*0b57cec5SDimitry Andric PythonObject value = GetItemForKey(key); 794*0b57cec5SDimitry Andric StructuredData::ObjectSP structured_value = value.CreateStructuredObject(); 795*0b57cec5SDimitry Andric result->AddItem(key.Str().GetString(), structured_value); 796*0b57cec5SDimitry Andric } 797*0b57cec5SDimitry Andric return result; 798*0b57cec5SDimitry Andric } 799*0b57cec5SDimitry Andric 800*0b57cec5SDimitry Andric PythonModule PythonModule::BuiltinsModule() { 801*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 802*0b57cec5SDimitry Andric return AddModule("builtins"); 803*0b57cec5SDimitry Andric #else 804*0b57cec5SDimitry Andric return AddModule("__builtin__"); 805*0b57cec5SDimitry Andric #endif 806*0b57cec5SDimitry Andric } 807*0b57cec5SDimitry Andric 808*0b57cec5SDimitry Andric PythonModule PythonModule::MainModule() { return AddModule("__main__"); } 809*0b57cec5SDimitry Andric 810*0b57cec5SDimitry Andric PythonModule PythonModule::AddModule(llvm::StringRef module) { 811*0b57cec5SDimitry Andric std::string str = module.str(); 812*0b57cec5SDimitry Andric return PythonModule(PyRefType::Borrowed, PyImport_AddModule(str.c_str())); 813*0b57cec5SDimitry Andric } 814*0b57cec5SDimitry Andric 8159dba64beSDimitry Andric Expected<PythonModule> PythonModule::Import(const Twine &name) { 8169dba64beSDimitry Andric PyObject *mod = PyImport_ImportModule(NullTerminated(name)); 8179dba64beSDimitry Andric if (!mod) 8189dba64beSDimitry Andric return exception(); 8199dba64beSDimitry Andric return Take<PythonModule>(mod); 8209dba64beSDimitry Andric } 8219dba64beSDimitry Andric 8229dba64beSDimitry Andric Expected<PythonObject> PythonModule::Get(const Twine &name) { 8239dba64beSDimitry Andric if (!IsValid()) 8249dba64beSDimitry Andric return nullDeref(); 8259dba64beSDimitry Andric PyObject *dict = PyModule_GetDict(m_py_obj); 8269dba64beSDimitry Andric if (!dict) 8279dba64beSDimitry Andric return exception(); 8289dba64beSDimitry Andric PyObject *item = PyDict_GetItemString(dict, NullTerminated(name)); 8299dba64beSDimitry Andric if (!item) 8309dba64beSDimitry Andric return exception(); 8319dba64beSDimitry Andric return Retain<PythonObject>(item); 832*0b57cec5SDimitry Andric } 833*0b57cec5SDimitry Andric 834*0b57cec5SDimitry Andric bool PythonModule::Check(PyObject *py_obj) { 835*0b57cec5SDimitry Andric if (!py_obj) 836*0b57cec5SDimitry Andric return false; 837*0b57cec5SDimitry Andric 838*0b57cec5SDimitry Andric return PyModule_Check(py_obj); 839*0b57cec5SDimitry Andric } 840*0b57cec5SDimitry Andric 841*0b57cec5SDimitry Andric PythonDictionary PythonModule::GetDictionary() const { 8429dba64beSDimitry Andric if (!IsValid()) 8439dba64beSDimitry Andric return PythonDictionary(); 8449dba64beSDimitry Andric return Retain<PythonDictionary>(PyModule_GetDict(m_py_obj)); 845*0b57cec5SDimitry Andric } 846*0b57cec5SDimitry Andric 847*0b57cec5SDimitry Andric bool PythonCallable::Check(PyObject *py_obj) { 848*0b57cec5SDimitry Andric if (!py_obj) 849*0b57cec5SDimitry Andric return false; 850*0b57cec5SDimitry Andric 851*0b57cec5SDimitry Andric return PyCallable_Check(py_obj); 852*0b57cec5SDimitry Andric } 853*0b57cec5SDimitry Andric 8549dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 && PY_MINOR_VERSION >= 3 8559dba64beSDimitry Andric static const char get_arg_info_script[] = R"( 8569dba64beSDimitry Andric from inspect import signature, Parameter, ismethod 8579dba64beSDimitry Andric from collections import namedtuple 858480093f4SDimitry Andric ArgInfo = namedtuple('ArgInfo', ['count', 'has_varargs']) 8599dba64beSDimitry Andric def main(f): 8609dba64beSDimitry Andric count = 0 8619dba64beSDimitry Andric varargs = False 8629dba64beSDimitry Andric for parameter in signature(f).parameters.values(): 8639dba64beSDimitry Andric kind = parameter.kind 8649dba64beSDimitry Andric if kind in (Parameter.POSITIONAL_ONLY, 8659dba64beSDimitry Andric Parameter.POSITIONAL_OR_KEYWORD): 8669dba64beSDimitry Andric count += 1 8679dba64beSDimitry Andric elif kind == Parameter.VAR_POSITIONAL: 8689dba64beSDimitry Andric varargs = True 8699dba64beSDimitry Andric elif kind in (Parameter.KEYWORD_ONLY, 8709dba64beSDimitry Andric Parameter.VAR_KEYWORD): 8719dba64beSDimitry Andric pass 8729dba64beSDimitry Andric else: 8739dba64beSDimitry Andric raise Exception(f'unknown parameter kind: {kind}') 874480093f4SDimitry Andric return ArgInfo(count, varargs) 8759dba64beSDimitry Andric )"; 8769dba64beSDimitry Andric #endif 8779dba64beSDimitry Andric 8789dba64beSDimitry Andric Expected<PythonCallable::ArgInfo> PythonCallable::GetArgInfo() const { 8799dba64beSDimitry Andric ArgInfo result = {}; 8809dba64beSDimitry Andric if (!IsValid()) 8819dba64beSDimitry Andric return nullDeref(); 8829dba64beSDimitry Andric 8839dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 && PY_MINOR_VERSION >= 3 8849dba64beSDimitry Andric 8859dba64beSDimitry Andric // no need to synchronize access to this global, we already have the GIL 8869dba64beSDimitry Andric static PythonScript get_arg_info(get_arg_info_script); 8879dba64beSDimitry Andric Expected<PythonObject> pyarginfo = get_arg_info(*this); 8889dba64beSDimitry Andric if (!pyarginfo) 8899dba64beSDimitry Andric return pyarginfo.takeError(); 890480093f4SDimitry Andric long long count = 891480093f4SDimitry Andric cantFail(As<long long>(pyarginfo.get().GetAttribute("count"))); 892480093f4SDimitry Andric bool has_varargs = 8939dba64beSDimitry Andric cantFail(As<bool>(pyarginfo.get().GetAttribute("has_varargs"))); 894480093f4SDimitry Andric result.max_positional_args = has_varargs ? ArgInfo::UNBOUNDED : count; 8959dba64beSDimitry Andric 8969dba64beSDimitry Andric #else 897480093f4SDimitry Andric PyObject *py_func_obj; 8989dba64beSDimitry Andric bool is_bound_method = false; 899480093f4SDimitry Andric bool is_class = false; 900480093f4SDimitry Andric 901480093f4SDimitry Andric if (PyType_Check(m_py_obj) || PyClass_Check(m_py_obj)) { 902480093f4SDimitry Andric auto init = GetAttribute("__init__"); 903480093f4SDimitry Andric if (!init) 904480093f4SDimitry Andric return init.takeError(); 905480093f4SDimitry Andric py_func_obj = init.get().get(); 906480093f4SDimitry Andric is_class = true; 907480093f4SDimitry Andric } else { 908480093f4SDimitry Andric py_func_obj = m_py_obj; 909480093f4SDimitry Andric } 910480093f4SDimitry Andric 911*0b57cec5SDimitry Andric if (PyMethod_Check(py_func_obj)) { 912*0b57cec5SDimitry Andric py_func_obj = PyMethod_GET_FUNCTION(py_func_obj); 913*0b57cec5SDimitry Andric PythonObject im_self = GetAttributeValue("im_self"); 914*0b57cec5SDimitry Andric if (im_self.IsValid() && !im_self.IsNone()) 9159dba64beSDimitry Andric is_bound_method = true; 916*0b57cec5SDimitry Andric } else { 917*0b57cec5SDimitry Andric // see if this is a callable object with an __call__ method 918*0b57cec5SDimitry Andric if (!PyFunction_Check(py_func_obj)) { 919*0b57cec5SDimitry Andric PythonObject __call__ = GetAttributeValue("__call__"); 920*0b57cec5SDimitry Andric if (__call__.IsValid()) { 921*0b57cec5SDimitry Andric auto __callable__ = __call__.AsType<PythonCallable>(); 922*0b57cec5SDimitry Andric if (__callable__.IsValid()) { 923*0b57cec5SDimitry Andric py_func_obj = PyMethod_GET_FUNCTION(__callable__.get()); 9249dba64beSDimitry Andric PythonObject im_self = __callable__.GetAttributeValue("im_self"); 925*0b57cec5SDimitry Andric if (im_self.IsValid() && !im_self.IsNone()) 9269dba64beSDimitry Andric is_bound_method = true; 927*0b57cec5SDimitry Andric } 928*0b57cec5SDimitry Andric } 929*0b57cec5SDimitry Andric } 930*0b57cec5SDimitry Andric } 931*0b57cec5SDimitry Andric 932*0b57cec5SDimitry Andric if (!py_func_obj) 933*0b57cec5SDimitry Andric return result; 934*0b57cec5SDimitry Andric 935*0b57cec5SDimitry Andric PyCodeObject *code = (PyCodeObject *)PyFunction_GET_CODE(py_func_obj); 936*0b57cec5SDimitry Andric if (!code) 937*0b57cec5SDimitry Andric return result; 938*0b57cec5SDimitry Andric 939480093f4SDimitry Andric auto count = code->co_argcount; 940480093f4SDimitry Andric bool has_varargs = !!(code->co_flags & CO_VARARGS); 941480093f4SDimitry Andric result.max_positional_args = 942480093f4SDimitry Andric has_varargs ? ArgInfo::UNBOUNDED 943480093f4SDimitry Andric : (count - (int)is_bound_method) - (int)is_class; 9449dba64beSDimitry Andric 9459dba64beSDimitry Andric #endif 9469dba64beSDimitry Andric 947*0b57cec5SDimitry Andric return result; 948*0b57cec5SDimitry Andric } 949*0b57cec5SDimitry Andric 9509dba64beSDimitry Andric constexpr unsigned 9519dba64beSDimitry Andric PythonCallable::ArgInfo::UNBOUNDED; // FIXME delete after c++17 9529dba64beSDimitry Andric 953*0b57cec5SDimitry Andric PythonObject PythonCallable::operator()() { 954*0b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, PyObject_CallObject(m_py_obj, nullptr)); 955*0b57cec5SDimitry Andric } 956*0b57cec5SDimitry Andric 957*0b57cec5SDimitry Andric PythonObject PythonCallable:: 958*0b57cec5SDimitry Andric operator()(std::initializer_list<PyObject *> args) { 959*0b57cec5SDimitry Andric PythonTuple arg_tuple(args); 960*0b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, 961*0b57cec5SDimitry Andric PyObject_CallObject(m_py_obj, arg_tuple.get())); 962*0b57cec5SDimitry Andric } 963*0b57cec5SDimitry Andric 964*0b57cec5SDimitry Andric PythonObject PythonCallable:: 965*0b57cec5SDimitry Andric operator()(std::initializer_list<PythonObject> args) { 966*0b57cec5SDimitry Andric PythonTuple arg_tuple(args); 967*0b57cec5SDimitry Andric return PythonObject(PyRefType::Owned, 968*0b57cec5SDimitry Andric PyObject_CallObject(m_py_obj, arg_tuple.get())); 969*0b57cec5SDimitry Andric } 970*0b57cec5SDimitry Andric 971*0b57cec5SDimitry Andric bool PythonFile::Check(PyObject *py_obj) { 9729dba64beSDimitry Andric if (!py_obj) 9739dba64beSDimitry Andric return false; 974*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION < 3 975*0b57cec5SDimitry Andric return PyFile_Check(py_obj); 976*0b57cec5SDimitry Andric #else 977*0b57cec5SDimitry Andric // In Python 3, there is no `PyFile_Check`, and in fact PyFile is not even a 978*0b57cec5SDimitry Andric // first-class object type anymore. `PyFile_FromFd` is just a thin wrapper 979*0b57cec5SDimitry Andric // over `io.open()`, which returns some object derived from `io.IOBase`. As a 980*0b57cec5SDimitry Andric // result, the only way to detect a file in Python 3 is to check whether it 9819dba64beSDimitry Andric // inherits from `io.IOBase`. 9829dba64beSDimitry Andric auto io_module = PythonModule::Import("io"); 9839dba64beSDimitry Andric if (!io_module) { 9849dba64beSDimitry Andric llvm::consumeError(io_module.takeError()); 985*0b57cec5SDimitry Andric return false; 9869dba64beSDimitry Andric } 9879dba64beSDimitry Andric auto iobase = io_module.get().Get("IOBase"); 9889dba64beSDimitry Andric if (!iobase) { 9899dba64beSDimitry Andric llvm::consumeError(iobase.takeError()); 990*0b57cec5SDimitry Andric return false; 9919dba64beSDimitry Andric } 9929dba64beSDimitry Andric int r = PyObject_IsInstance(py_obj, iobase.get().get()); 9939dba64beSDimitry Andric if (r < 0) { 9949dba64beSDimitry Andric llvm::consumeError(exception()); // clear the exception and log it. 9959dba64beSDimitry Andric return false; 9969dba64beSDimitry Andric } 9979dba64beSDimitry Andric return !!r; 998*0b57cec5SDimitry Andric #endif 999*0b57cec5SDimitry Andric } 1000*0b57cec5SDimitry Andric 10019dba64beSDimitry Andric namespace { 10029dba64beSDimitry Andric class GIL { 10039dba64beSDimitry Andric public: 10049dba64beSDimitry Andric GIL() { 10059dba64beSDimitry Andric m_state = PyGILState_Ensure(); 10069dba64beSDimitry Andric assert(!PyErr_Occurred()); 10079dba64beSDimitry Andric } 10089dba64beSDimitry Andric ~GIL() { PyGILState_Release(m_state); } 1009*0b57cec5SDimitry Andric 10109dba64beSDimitry Andric protected: 10119dba64beSDimitry Andric PyGILState_STATE m_state; 10129dba64beSDimitry Andric }; 10139dba64beSDimitry Andric } // namespace 10149dba64beSDimitry Andric 10159dba64beSDimitry Andric const char *PythonException::toCString() const { 10169dba64beSDimitry Andric if (!m_repr_bytes) 10179dba64beSDimitry Andric return "unknown exception"; 10189dba64beSDimitry Andric return PyBytes_AS_STRING(m_repr_bytes); 1019*0b57cec5SDimitry Andric } 1020*0b57cec5SDimitry Andric 10219dba64beSDimitry Andric PythonException::PythonException(const char *caller) { 10229dba64beSDimitry Andric assert(PyErr_Occurred()); 10239dba64beSDimitry Andric m_exception_type = m_exception = m_traceback = m_repr_bytes = NULL; 10249dba64beSDimitry Andric PyErr_Fetch(&m_exception_type, &m_exception, &m_traceback); 10259dba64beSDimitry Andric PyErr_NormalizeException(&m_exception_type, &m_exception, &m_traceback); 10269dba64beSDimitry Andric PyErr_Clear(); 10279dba64beSDimitry Andric if (m_exception) { 10289dba64beSDimitry Andric PyObject *repr = PyObject_Repr(m_exception); 10299dba64beSDimitry Andric if (repr) { 10309dba64beSDimitry Andric m_repr_bytes = PyUnicode_AsEncodedString(repr, "utf-8", nullptr); 10319dba64beSDimitry Andric if (!m_repr_bytes) { 10329dba64beSDimitry Andric PyErr_Clear(); 10339dba64beSDimitry Andric } 10349dba64beSDimitry Andric Py_XDECREF(repr); 10359dba64beSDimitry Andric } else { 10369dba64beSDimitry Andric PyErr_Clear(); 10379dba64beSDimitry Andric } 10389dba64beSDimitry Andric } 10399dba64beSDimitry Andric Log *log = GetLogIfAllCategoriesSet(LIBLLDB_LOG_SCRIPT); 10409dba64beSDimitry Andric if (caller) 10419dba64beSDimitry Andric LLDB_LOGF(log, "%s failed with exception: %s", caller, toCString()); 10429dba64beSDimitry Andric else 10439dba64beSDimitry Andric LLDB_LOGF(log, "python exception: %s", toCString()); 10449dba64beSDimitry Andric } 10459dba64beSDimitry Andric void PythonException::Restore() { 10469dba64beSDimitry Andric if (m_exception_type && m_exception) { 10479dba64beSDimitry Andric PyErr_Restore(m_exception_type, m_exception, m_traceback); 10489dba64beSDimitry Andric } else { 10499dba64beSDimitry Andric PyErr_SetString(PyExc_Exception, toCString()); 10509dba64beSDimitry Andric } 10519dba64beSDimitry Andric m_exception_type = m_exception = m_traceback = NULL; 1052*0b57cec5SDimitry Andric } 1053*0b57cec5SDimitry Andric 10549dba64beSDimitry Andric PythonException::~PythonException() { 10559dba64beSDimitry Andric Py_XDECREF(m_exception_type); 10569dba64beSDimitry Andric Py_XDECREF(m_exception); 10579dba64beSDimitry Andric Py_XDECREF(m_traceback); 10589dba64beSDimitry Andric Py_XDECREF(m_repr_bytes); 1059*0b57cec5SDimitry Andric } 1060*0b57cec5SDimitry Andric 10619dba64beSDimitry Andric void PythonException::log(llvm::raw_ostream &OS) const { OS << toCString(); } 10629dba64beSDimitry Andric 10639dba64beSDimitry Andric std::error_code PythonException::convertToErrorCode() const { 10649dba64beSDimitry Andric return llvm::inconvertibleErrorCode(); 10659dba64beSDimitry Andric } 10669dba64beSDimitry Andric 10679dba64beSDimitry Andric bool PythonException::Matches(PyObject *exc) const { 10689dba64beSDimitry Andric return PyErr_GivenExceptionMatches(m_exception_type, exc); 10699dba64beSDimitry Andric } 10709dba64beSDimitry Andric 10719dba64beSDimitry Andric const char read_exception_script[] = R"( 10729dba64beSDimitry Andric import sys 10739dba64beSDimitry Andric from traceback import print_exception 10749dba64beSDimitry Andric if sys.version_info.major < 3: 10759dba64beSDimitry Andric from StringIO import StringIO 10769dba64beSDimitry Andric else: 10779dba64beSDimitry Andric from io import StringIO 10789dba64beSDimitry Andric def main(exc_type, exc_value, tb): 10799dba64beSDimitry Andric f = StringIO() 10809dba64beSDimitry Andric print_exception(exc_type, exc_value, tb, file=f) 10819dba64beSDimitry Andric return f.getvalue() 10829dba64beSDimitry Andric )"; 10839dba64beSDimitry Andric 10849dba64beSDimitry Andric std::string PythonException::ReadBacktrace() const { 10859dba64beSDimitry Andric 10869dba64beSDimitry Andric if (!m_traceback) 10879dba64beSDimitry Andric return toCString(); 10889dba64beSDimitry Andric 10899dba64beSDimitry Andric // no need to synchronize access to this global, we already have the GIL 10909dba64beSDimitry Andric static PythonScript read_exception(read_exception_script); 10919dba64beSDimitry Andric 10929dba64beSDimitry Andric Expected<std::string> backtrace = As<std::string>( 10939dba64beSDimitry Andric read_exception(m_exception_type, m_exception, m_traceback)); 10949dba64beSDimitry Andric 10959dba64beSDimitry Andric if (!backtrace) { 10969dba64beSDimitry Andric std::string message = 10979dba64beSDimitry Andric std::string(toCString()) + "\n" + 10985ffd83dbSDimitry Andric "Traceback unavailable, an error occurred while reading it:\n"; 10999dba64beSDimitry Andric return (message + llvm::toString(backtrace.takeError())); 11009dba64beSDimitry Andric } 11019dba64beSDimitry Andric 11029dba64beSDimitry Andric return std::move(backtrace.get()); 11039dba64beSDimitry Andric } 11049dba64beSDimitry Andric 11059dba64beSDimitry Andric char PythonException::ID = 0; 11069dba64beSDimitry Andric 11079dba64beSDimitry Andric llvm::Expected<File::OpenOptions> 11089dba64beSDimitry Andric GetOptionsForPyObject(const PythonObject &obj) { 1109*0b57cec5SDimitry Andric #if PY_MAJOR_VERSION >= 3 11109dba64beSDimitry Andric auto options = File::OpenOptions(0); 11119dba64beSDimitry Andric auto readable = As<bool>(obj.CallMethod("readable")); 11129dba64beSDimitry Andric if (!readable) 11139dba64beSDimitry Andric return readable.takeError(); 11149dba64beSDimitry Andric auto writable = As<bool>(obj.CallMethod("writable")); 11159dba64beSDimitry Andric if (!writable) 11169dba64beSDimitry Andric return writable.takeError(); 11179dba64beSDimitry Andric if (readable.get()) 11189dba64beSDimitry Andric options |= File::eOpenOptionRead; 11199dba64beSDimitry Andric if (writable.get()) 11209dba64beSDimitry Andric options |= File::eOpenOptionWrite; 11219dba64beSDimitry Andric return options; 11229dba64beSDimitry Andric #else 11239dba64beSDimitry Andric PythonString py_mode = obj.GetAttributeValue("mode").AsType<PythonString>(); 11249dba64beSDimitry Andric return File::GetOptionsFromMode(py_mode.GetString()); 11259dba64beSDimitry Andric #endif 11269dba64beSDimitry Andric } 11279dba64beSDimitry Andric 11289dba64beSDimitry Andric // Base class template for python files. All it knows how to do 11299dba64beSDimitry Andric // is hold a reference to the python object and close or flush it 11309dba64beSDimitry Andric // when the File is closed. 11319dba64beSDimitry Andric namespace { 11329dba64beSDimitry Andric template <typename Base> class OwnedPythonFile : public Base { 11339dba64beSDimitry Andric public: 11349dba64beSDimitry Andric template <typename... Args> 11359dba64beSDimitry Andric OwnedPythonFile(const PythonFile &file, bool borrowed, Args... args) 11369dba64beSDimitry Andric : Base(args...), m_py_obj(file), m_borrowed(borrowed) { 11379dba64beSDimitry Andric assert(m_py_obj); 11389dba64beSDimitry Andric } 11399dba64beSDimitry Andric 11409dba64beSDimitry Andric ~OwnedPythonFile() override { 11419dba64beSDimitry Andric assert(m_py_obj); 11429dba64beSDimitry Andric GIL takeGIL; 11439dba64beSDimitry Andric Close(); 11449dba64beSDimitry Andric // we need to ensure the python object is released while we still 11459dba64beSDimitry Andric // hold the GIL 11469dba64beSDimitry Andric m_py_obj.Reset(); 11479dba64beSDimitry Andric } 11489dba64beSDimitry Andric 11499dba64beSDimitry Andric bool IsPythonSideValid() const { 11509dba64beSDimitry Andric GIL takeGIL; 11519dba64beSDimitry Andric auto closed = As<bool>(m_py_obj.GetAttribute("closed")); 11529dba64beSDimitry Andric if (!closed) { 11539dba64beSDimitry Andric llvm::consumeError(closed.takeError()); 11549dba64beSDimitry Andric return false; 11559dba64beSDimitry Andric } 11569dba64beSDimitry Andric return !closed.get(); 11579dba64beSDimitry Andric } 11589dba64beSDimitry Andric 11599dba64beSDimitry Andric bool IsValid() const override { 11609dba64beSDimitry Andric return IsPythonSideValid() && Base::IsValid(); 11619dba64beSDimitry Andric } 11629dba64beSDimitry Andric 11639dba64beSDimitry Andric Status Close() override { 11649dba64beSDimitry Andric assert(m_py_obj); 11659dba64beSDimitry Andric Status py_error, base_error; 11669dba64beSDimitry Andric GIL takeGIL; 11679dba64beSDimitry Andric if (!m_borrowed) { 11689dba64beSDimitry Andric auto r = m_py_obj.CallMethod("close"); 11699dba64beSDimitry Andric if (!r) 11709dba64beSDimitry Andric py_error = Status(r.takeError()); 11719dba64beSDimitry Andric } 11729dba64beSDimitry Andric base_error = Base::Close(); 11739dba64beSDimitry Andric if (py_error.Fail()) 11749dba64beSDimitry Andric return py_error; 11759dba64beSDimitry Andric return base_error; 11769dba64beSDimitry Andric }; 11779dba64beSDimitry Andric 11789dba64beSDimitry Andric PyObject *GetPythonObject() const { 11799dba64beSDimitry Andric assert(m_py_obj.IsValid()); 11809dba64beSDimitry Andric return m_py_obj.get(); 11819dba64beSDimitry Andric } 11829dba64beSDimitry Andric 11839dba64beSDimitry Andric static bool classof(const File *file) = delete; 11849dba64beSDimitry Andric 11859dba64beSDimitry Andric protected: 11869dba64beSDimitry Andric PythonFile m_py_obj; 11879dba64beSDimitry Andric bool m_borrowed; 11889dba64beSDimitry Andric }; 11899dba64beSDimitry Andric } // namespace 11909dba64beSDimitry Andric 11919dba64beSDimitry Andric // A SimplePythonFile is a OwnedPythonFile that just does all I/O as 11929dba64beSDimitry Andric // a NativeFile 11939dba64beSDimitry Andric namespace { 11949dba64beSDimitry Andric class SimplePythonFile : public OwnedPythonFile<NativeFile> { 11959dba64beSDimitry Andric public: 11969dba64beSDimitry Andric SimplePythonFile(const PythonFile &file, bool borrowed, int fd, 11979dba64beSDimitry Andric File::OpenOptions options) 11989dba64beSDimitry Andric : OwnedPythonFile(file, borrowed, fd, options, false) {} 11999dba64beSDimitry Andric 12009dba64beSDimitry Andric static char ID; 12019dba64beSDimitry Andric bool isA(const void *classID) const override { 12029dba64beSDimitry Andric return classID == &ID || NativeFile::isA(classID); 12039dba64beSDimitry Andric } 12049dba64beSDimitry Andric static bool classof(const File *file) { return file->isA(&ID); } 12059dba64beSDimitry Andric }; 12069dba64beSDimitry Andric char SimplePythonFile::ID = 0; 12079dba64beSDimitry Andric } // namespace 12089dba64beSDimitry Andric 12099dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 12109dba64beSDimitry Andric 12119dba64beSDimitry Andric namespace { 12129dba64beSDimitry Andric class PythonBuffer { 12139dba64beSDimitry Andric public: 12149dba64beSDimitry Andric PythonBuffer &operator=(const PythonBuffer &) = delete; 12159dba64beSDimitry Andric PythonBuffer(const PythonBuffer &) = delete; 12169dba64beSDimitry Andric 12179dba64beSDimitry Andric static Expected<PythonBuffer> Create(PythonObject &obj, 12189dba64beSDimitry Andric int flags = PyBUF_SIMPLE) { 12199dba64beSDimitry Andric Py_buffer py_buffer = {}; 12209dba64beSDimitry Andric PyObject_GetBuffer(obj.get(), &py_buffer, flags); 12219dba64beSDimitry Andric if (!py_buffer.obj) 12229dba64beSDimitry Andric return llvm::make_error<PythonException>(); 12239dba64beSDimitry Andric return PythonBuffer(py_buffer); 12249dba64beSDimitry Andric } 12259dba64beSDimitry Andric 12269dba64beSDimitry Andric PythonBuffer(PythonBuffer &&other) { 12279dba64beSDimitry Andric m_buffer = other.m_buffer; 12289dba64beSDimitry Andric other.m_buffer.obj = nullptr; 12299dba64beSDimitry Andric } 12309dba64beSDimitry Andric 12319dba64beSDimitry Andric ~PythonBuffer() { 12329dba64beSDimitry Andric if (m_buffer.obj) 12339dba64beSDimitry Andric PyBuffer_Release(&m_buffer); 12349dba64beSDimitry Andric } 12359dba64beSDimitry Andric 12369dba64beSDimitry Andric Py_buffer &get() { return m_buffer; } 12379dba64beSDimitry Andric 12389dba64beSDimitry Andric private: 12399dba64beSDimitry Andric // takes ownership of the buffer. 12409dba64beSDimitry Andric PythonBuffer(const Py_buffer &py_buffer) : m_buffer(py_buffer) {} 12419dba64beSDimitry Andric Py_buffer m_buffer; 12429dba64beSDimitry Andric }; 12439dba64beSDimitry Andric } // namespace 12449dba64beSDimitry Andric 12459dba64beSDimitry Andric // Shared methods between TextPythonFile and BinaryPythonFile 12469dba64beSDimitry Andric namespace { 12479dba64beSDimitry Andric class PythonIOFile : public OwnedPythonFile<File> { 12489dba64beSDimitry Andric public: 12499dba64beSDimitry Andric PythonIOFile(const PythonFile &file, bool borrowed) 12509dba64beSDimitry Andric : OwnedPythonFile(file, borrowed) {} 12519dba64beSDimitry Andric 12529dba64beSDimitry Andric ~PythonIOFile() override { Close(); } 12539dba64beSDimitry Andric 12549dba64beSDimitry Andric bool IsValid() const override { return IsPythonSideValid(); } 12559dba64beSDimitry Andric 12569dba64beSDimitry Andric Status Close() override { 12579dba64beSDimitry Andric assert(m_py_obj); 12589dba64beSDimitry Andric GIL takeGIL; 12599dba64beSDimitry Andric if (m_borrowed) 12609dba64beSDimitry Andric return Flush(); 12619dba64beSDimitry Andric auto r = m_py_obj.CallMethod("close"); 12629dba64beSDimitry Andric if (!r) 12639dba64beSDimitry Andric return Status(r.takeError()); 12649dba64beSDimitry Andric return Status(); 12659dba64beSDimitry Andric } 12669dba64beSDimitry Andric 12679dba64beSDimitry Andric Status Flush() override { 12689dba64beSDimitry Andric GIL takeGIL; 12699dba64beSDimitry Andric auto r = m_py_obj.CallMethod("flush"); 12709dba64beSDimitry Andric if (!r) 12719dba64beSDimitry Andric return Status(r.takeError()); 12729dba64beSDimitry Andric return Status(); 12739dba64beSDimitry Andric } 12749dba64beSDimitry Andric 12759dba64beSDimitry Andric Expected<File::OpenOptions> GetOptions() const override { 12769dba64beSDimitry Andric GIL takeGIL; 12779dba64beSDimitry Andric return GetOptionsForPyObject(m_py_obj); 12789dba64beSDimitry Andric } 12799dba64beSDimitry Andric 12809dba64beSDimitry Andric static char ID; 12819dba64beSDimitry Andric bool isA(const void *classID) const override { 12829dba64beSDimitry Andric return classID == &ID || File::isA(classID); 12839dba64beSDimitry Andric } 12849dba64beSDimitry Andric static bool classof(const File *file) { return file->isA(&ID); } 12859dba64beSDimitry Andric }; 12869dba64beSDimitry Andric char PythonIOFile::ID = 0; 12879dba64beSDimitry Andric } // namespace 12889dba64beSDimitry Andric 12899dba64beSDimitry Andric namespace { 12909dba64beSDimitry Andric class BinaryPythonFile : public PythonIOFile { 12919dba64beSDimitry Andric protected: 12929dba64beSDimitry Andric int m_descriptor; 12939dba64beSDimitry Andric 12949dba64beSDimitry Andric public: 12959dba64beSDimitry Andric BinaryPythonFile(int fd, const PythonFile &file, bool borrowed) 12969dba64beSDimitry Andric : PythonIOFile(file, borrowed), 12979dba64beSDimitry Andric m_descriptor(File::DescriptorIsValid(fd) ? fd 12989dba64beSDimitry Andric : File::kInvalidDescriptor) {} 12999dba64beSDimitry Andric 13009dba64beSDimitry Andric int GetDescriptor() const override { return m_descriptor; } 13019dba64beSDimitry Andric 13029dba64beSDimitry Andric Status Write(const void *buf, size_t &num_bytes) override { 13039dba64beSDimitry Andric GIL takeGIL; 13049dba64beSDimitry Andric PyObject *pybuffer_p = PyMemoryView_FromMemory( 13059dba64beSDimitry Andric const_cast<char *>((const char *)buf), num_bytes, PyBUF_READ); 13069dba64beSDimitry Andric if (!pybuffer_p) 13079dba64beSDimitry Andric return Status(llvm::make_error<PythonException>()); 13089dba64beSDimitry Andric auto pybuffer = Take<PythonObject>(pybuffer_p); 13099dba64beSDimitry Andric num_bytes = 0; 13109dba64beSDimitry Andric auto bytes_written = As<long long>(m_py_obj.CallMethod("write", pybuffer)); 13119dba64beSDimitry Andric if (!bytes_written) 13129dba64beSDimitry Andric return Status(bytes_written.takeError()); 13139dba64beSDimitry Andric if (bytes_written.get() < 0) 13149dba64beSDimitry Andric return Status(".write() method returned a negative number!"); 13159dba64beSDimitry Andric static_assert(sizeof(long long) >= sizeof(size_t), "overflow"); 13169dba64beSDimitry Andric num_bytes = bytes_written.get(); 13179dba64beSDimitry Andric return Status(); 13189dba64beSDimitry Andric } 13199dba64beSDimitry Andric 13209dba64beSDimitry Andric Status Read(void *buf, size_t &num_bytes) override { 13219dba64beSDimitry Andric GIL takeGIL; 13229dba64beSDimitry Andric static_assert(sizeof(long long) >= sizeof(size_t), "overflow"); 13239dba64beSDimitry Andric auto pybuffer_obj = 13249dba64beSDimitry Andric m_py_obj.CallMethod("read", (unsigned long long)num_bytes); 13259dba64beSDimitry Andric if (!pybuffer_obj) 13269dba64beSDimitry Andric return Status(pybuffer_obj.takeError()); 13279dba64beSDimitry Andric num_bytes = 0; 13289dba64beSDimitry Andric if (pybuffer_obj.get().IsNone()) { 13299dba64beSDimitry Andric // EOF 13309dba64beSDimitry Andric num_bytes = 0; 13319dba64beSDimitry Andric return Status(); 13329dba64beSDimitry Andric } 13339dba64beSDimitry Andric auto pybuffer = PythonBuffer::Create(pybuffer_obj.get()); 13349dba64beSDimitry Andric if (!pybuffer) 13359dba64beSDimitry Andric return Status(pybuffer.takeError()); 13369dba64beSDimitry Andric memcpy(buf, pybuffer.get().get().buf, pybuffer.get().get().len); 13379dba64beSDimitry Andric num_bytes = pybuffer.get().get().len; 13389dba64beSDimitry Andric return Status(); 13399dba64beSDimitry Andric } 13409dba64beSDimitry Andric }; 13419dba64beSDimitry Andric } // namespace 13429dba64beSDimitry Andric 13439dba64beSDimitry Andric namespace { 13449dba64beSDimitry Andric class TextPythonFile : public PythonIOFile { 13459dba64beSDimitry Andric protected: 13469dba64beSDimitry Andric int m_descriptor; 13479dba64beSDimitry Andric 13489dba64beSDimitry Andric public: 13499dba64beSDimitry Andric TextPythonFile(int fd, const PythonFile &file, bool borrowed) 13509dba64beSDimitry Andric : PythonIOFile(file, borrowed), 13519dba64beSDimitry Andric m_descriptor(File::DescriptorIsValid(fd) ? fd 13529dba64beSDimitry Andric : File::kInvalidDescriptor) {} 13539dba64beSDimitry Andric 13549dba64beSDimitry Andric int GetDescriptor() const override { return m_descriptor; } 13559dba64beSDimitry Andric 13569dba64beSDimitry Andric Status Write(const void *buf, size_t &num_bytes) override { 13579dba64beSDimitry Andric GIL takeGIL; 13589dba64beSDimitry Andric auto pystring = 13599dba64beSDimitry Andric PythonString::FromUTF8(llvm::StringRef((const char *)buf, num_bytes)); 13609dba64beSDimitry Andric if (!pystring) 13619dba64beSDimitry Andric return Status(pystring.takeError()); 13629dba64beSDimitry Andric num_bytes = 0; 13639dba64beSDimitry Andric auto bytes_written = 13649dba64beSDimitry Andric As<long long>(m_py_obj.CallMethod("write", pystring.get())); 13659dba64beSDimitry Andric if (!bytes_written) 13669dba64beSDimitry Andric return Status(bytes_written.takeError()); 13679dba64beSDimitry Andric if (bytes_written.get() < 0) 13689dba64beSDimitry Andric return Status(".write() method returned a negative number!"); 13699dba64beSDimitry Andric static_assert(sizeof(long long) >= sizeof(size_t), "overflow"); 13709dba64beSDimitry Andric num_bytes = bytes_written.get(); 13719dba64beSDimitry Andric return Status(); 13729dba64beSDimitry Andric } 13739dba64beSDimitry Andric 13749dba64beSDimitry Andric Status Read(void *buf, size_t &num_bytes) override { 13759dba64beSDimitry Andric GIL takeGIL; 13769dba64beSDimitry Andric size_t num_chars = num_bytes / 6; 13779dba64beSDimitry Andric size_t orig_num_bytes = num_bytes; 13789dba64beSDimitry Andric num_bytes = 0; 13799dba64beSDimitry Andric if (orig_num_bytes < 6) { 13809dba64beSDimitry Andric return Status("can't read less than 6 bytes from a utf8 text stream"); 13819dba64beSDimitry Andric } 13829dba64beSDimitry Andric auto pystring = As<PythonString>( 13839dba64beSDimitry Andric m_py_obj.CallMethod("read", (unsigned long long)num_chars)); 13849dba64beSDimitry Andric if (!pystring) 13859dba64beSDimitry Andric return Status(pystring.takeError()); 13869dba64beSDimitry Andric if (pystring.get().IsNone()) { 13879dba64beSDimitry Andric // EOF 13889dba64beSDimitry Andric return Status(); 13899dba64beSDimitry Andric } 13909dba64beSDimitry Andric auto stringref = pystring.get().AsUTF8(); 13919dba64beSDimitry Andric if (!stringref) 13929dba64beSDimitry Andric return Status(stringref.takeError()); 13939dba64beSDimitry Andric num_bytes = stringref.get().size(); 13949dba64beSDimitry Andric memcpy(buf, stringref.get().begin(), num_bytes); 13959dba64beSDimitry Andric return Status(); 13969dba64beSDimitry Andric } 13979dba64beSDimitry Andric }; 13989dba64beSDimitry Andric } // namespace 13999dba64beSDimitry Andric 14009dba64beSDimitry Andric #endif 14019dba64beSDimitry Andric 14029dba64beSDimitry Andric llvm::Expected<FileSP> PythonFile::ConvertToFile(bool borrowed) { 14039dba64beSDimitry Andric if (!IsValid()) 14049dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14059dba64beSDimitry Andric "invalid PythonFile"); 14069dba64beSDimitry Andric 14079dba64beSDimitry Andric int fd = PyObject_AsFileDescriptor(m_py_obj); 14089dba64beSDimitry Andric if (fd < 0) { 14099dba64beSDimitry Andric PyErr_Clear(); 14109dba64beSDimitry Andric return ConvertToFileForcingUseOfScriptingIOMethods(borrowed); 14119dba64beSDimitry Andric } 14129dba64beSDimitry Andric auto options = GetOptionsForPyObject(*this); 14139dba64beSDimitry Andric if (!options) 14149dba64beSDimitry Andric return options.takeError(); 14159dba64beSDimitry Andric 1416480093f4SDimitry Andric if (options.get() & File::eOpenOptionWrite) { 14179dba64beSDimitry Andric // LLDB and python will not share I/O buffers. We should probably 14189dba64beSDimitry Andric // flush the python buffers now. 14199dba64beSDimitry Andric auto r = CallMethod("flush"); 14209dba64beSDimitry Andric if (!r) 14219dba64beSDimitry Andric return r.takeError(); 1422480093f4SDimitry Andric } 14239dba64beSDimitry Andric 14249dba64beSDimitry Andric FileSP file_sp; 14259dba64beSDimitry Andric if (borrowed) { 14269dba64beSDimitry Andric // In this case we we don't need to retain the python 14279dba64beSDimitry Andric // object at all. 14289dba64beSDimitry Andric file_sp = std::make_shared<NativeFile>(fd, options.get(), false); 14299dba64beSDimitry Andric } else { 14309dba64beSDimitry Andric file_sp = std::static_pointer_cast<File>( 14319dba64beSDimitry Andric std::make_shared<SimplePythonFile>(*this, borrowed, fd, options.get())); 14329dba64beSDimitry Andric } 14339dba64beSDimitry Andric if (!file_sp->IsValid()) 14349dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14359dba64beSDimitry Andric "invalid File"); 14369dba64beSDimitry Andric 14379dba64beSDimitry Andric return file_sp; 14389dba64beSDimitry Andric } 14399dba64beSDimitry Andric 14409dba64beSDimitry Andric llvm::Expected<FileSP> 14419dba64beSDimitry Andric PythonFile::ConvertToFileForcingUseOfScriptingIOMethods(bool borrowed) { 14429dba64beSDimitry Andric 14439dba64beSDimitry Andric assert(!PyErr_Occurred()); 14449dba64beSDimitry Andric 14459dba64beSDimitry Andric if (!IsValid()) 14469dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14479dba64beSDimitry Andric "invalid PythonFile"); 14489dba64beSDimitry Andric 14499dba64beSDimitry Andric #if PY_MAJOR_VERSION < 3 14509dba64beSDimitry Andric 14519dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14529dba64beSDimitry Andric "not supported on python 2"); 14539dba64beSDimitry Andric 14549dba64beSDimitry Andric #else 14559dba64beSDimitry Andric 14569dba64beSDimitry Andric int fd = PyObject_AsFileDescriptor(m_py_obj); 14579dba64beSDimitry Andric if (fd < 0) { 14589dba64beSDimitry Andric PyErr_Clear(); 14599dba64beSDimitry Andric fd = File::kInvalidDescriptor; 14609dba64beSDimitry Andric } 14619dba64beSDimitry Andric 14629dba64beSDimitry Andric auto io_module = PythonModule::Import("io"); 14639dba64beSDimitry Andric if (!io_module) 14649dba64beSDimitry Andric return io_module.takeError(); 14659dba64beSDimitry Andric auto textIOBase = io_module.get().Get("TextIOBase"); 14669dba64beSDimitry Andric if (!textIOBase) 14679dba64beSDimitry Andric return textIOBase.takeError(); 14689dba64beSDimitry Andric auto rawIOBase = io_module.get().Get("RawIOBase"); 14699dba64beSDimitry Andric if (!rawIOBase) 14709dba64beSDimitry Andric return rawIOBase.takeError(); 14719dba64beSDimitry Andric auto bufferedIOBase = io_module.get().Get("BufferedIOBase"); 14729dba64beSDimitry Andric if (!bufferedIOBase) 14739dba64beSDimitry Andric return bufferedIOBase.takeError(); 14749dba64beSDimitry Andric 14759dba64beSDimitry Andric FileSP file_sp; 14769dba64beSDimitry Andric 14779dba64beSDimitry Andric auto isTextIO = IsInstance(textIOBase.get()); 14789dba64beSDimitry Andric if (!isTextIO) 14799dba64beSDimitry Andric return isTextIO.takeError(); 14809dba64beSDimitry Andric if (isTextIO.get()) 14819dba64beSDimitry Andric file_sp = std::static_pointer_cast<File>( 14829dba64beSDimitry Andric std::make_shared<TextPythonFile>(fd, *this, borrowed)); 14839dba64beSDimitry Andric 14849dba64beSDimitry Andric auto isRawIO = IsInstance(rawIOBase.get()); 14859dba64beSDimitry Andric if (!isRawIO) 14869dba64beSDimitry Andric return isRawIO.takeError(); 14879dba64beSDimitry Andric auto isBufferedIO = IsInstance(bufferedIOBase.get()); 14889dba64beSDimitry Andric if (!isBufferedIO) 14899dba64beSDimitry Andric return isBufferedIO.takeError(); 14909dba64beSDimitry Andric 14919dba64beSDimitry Andric if (isRawIO.get() || isBufferedIO.get()) { 14929dba64beSDimitry Andric file_sp = std::static_pointer_cast<File>( 14939dba64beSDimitry Andric std::make_shared<BinaryPythonFile>(fd, *this, borrowed)); 14949dba64beSDimitry Andric } 14959dba64beSDimitry Andric 14969dba64beSDimitry Andric if (!file_sp) 14979dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 14989dba64beSDimitry Andric "python file is neither text nor binary"); 14999dba64beSDimitry Andric 15009dba64beSDimitry Andric if (!file_sp->IsValid()) 15019dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 15029dba64beSDimitry Andric "invalid File"); 15039dba64beSDimitry Andric 15049dba64beSDimitry Andric return file_sp; 15059dba64beSDimitry Andric 15069dba64beSDimitry Andric #endif 15079dba64beSDimitry Andric } 15089dba64beSDimitry Andric 15099dba64beSDimitry Andric Expected<PythonFile> PythonFile::FromFile(File &file, const char *mode) { 15109dba64beSDimitry Andric if (!file.IsValid()) 15119dba64beSDimitry Andric return llvm::createStringError(llvm::inconvertibleErrorCode(), 15129dba64beSDimitry Andric "invalid file"); 15139dba64beSDimitry Andric 15149dba64beSDimitry Andric if (auto *simple = llvm::dyn_cast<SimplePythonFile>(&file)) 15159dba64beSDimitry Andric return Retain<PythonFile>(simple->GetPythonObject()); 15169dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 15179dba64beSDimitry Andric if (auto *pythonio = llvm::dyn_cast<PythonIOFile>(&file)) 15189dba64beSDimitry Andric return Retain<PythonFile>(pythonio->GetPythonObject()); 15199dba64beSDimitry Andric #endif 15209dba64beSDimitry Andric 15219dba64beSDimitry Andric if (!mode) { 15229dba64beSDimitry Andric auto m = file.GetOpenMode(); 15239dba64beSDimitry Andric if (!m) 15249dba64beSDimitry Andric return m.takeError(); 15259dba64beSDimitry Andric mode = m.get(); 15269dba64beSDimitry Andric } 15279dba64beSDimitry Andric 15289dba64beSDimitry Andric PyObject *file_obj; 15299dba64beSDimitry Andric #if PY_MAJOR_VERSION >= 3 15309dba64beSDimitry Andric file_obj = PyFile_FromFd(file.GetDescriptor(), nullptr, mode, -1, nullptr, 1531480093f4SDimitry Andric "ignore", nullptr, /*closefd=*/0); 1532*0b57cec5SDimitry Andric #else 1533480093f4SDimitry Andric // I'd like to pass ::fflush here if the file is writable, so that 1534480093f4SDimitry Andric // when the python side destructs the file object it will be flushed. 1535480093f4SDimitry Andric // However, this would be dangerous. It can cause fflush to be called 1536480093f4SDimitry Andric // after fclose if the python program keeps a reference to the file after 1537480093f4SDimitry Andric // the original lldb_private::File has been destructed. 1538480093f4SDimitry Andric // 1539480093f4SDimitry Andric // It's all well and good to ask a python program not to use a closed file 1540480093f4SDimitry Andric // but asking a python program to make sure objects get released in a 1541480093f4SDimitry Andric // particular order is not safe. 1542480093f4SDimitry Andric // 1543480093f4SDimitry Andric // The tradeoff here is that if a python 2 program wants to make sure this 1544480093f4SDimitry Andric // file gets flushed, they'll have to do it explicitly or wait untill the 1545480093f4SDimitry Andric // original lldb File itself gets flushed. 1546480093f4SDimitry Andric file_obj = PyFile_FromFile(file.GetStream(), py2_const_cast(""), 1547480093f4SDimitry Andric py2_const_cast(mode), [](FILE *) { return 0; }); 1548*0b57cec5SDimitry Andric #endif 15499dba64beSDimitry Andric 15509dba64beSDimitry Andric if (!file_obj) 15519dba64beSDimitry Andric return exception(); 15529dba64beSDimitry Andric 15539dba64beSDimitry Andric return Take<PythonFile>(file_obj); 1554*0b57cec5SDimitry Andric } 1555*0b57cec5SDimitry Andric 15569dba64beSDimitry Andric Error PythonScript::Init() { 15579dba64beSDimitry Andric if (function.IsValid()) 15589dba64beSDimitry Andric return Error::success(); 1559*0b57cec5SDimitry Andric 15609dba64beSDimitry Andric PythonDictionary globals(PyInitialValue::Empty); 15619dba64beSDimitry Andric auto builtins = PythonModule::BuiltinsModule(); 15629dba64beSDimitry Andric if (Error error = globals.SetItem("__builtins__", builtins)) 15639dba64beSDimitry Andric return error; 15649dba64beSDimitry Andric PyObject *o = 15659dba64beSDimitry Andric PyRun_String(script, Py_file_input, globals.get(), globals.get()); 15669dba64beSDimitry Andric if (!o) 15679dba64beSDimitry Andric return exception(); 15689dba64beSDimitry Andric Take<PythonObject>(o); 15699dba64beSDimitry Andric auto f = As<PythonCallable>(globals.GetItem("main")); 15709dba64beSDimitry Andric if (!f) 15719dba64beSDimitry Andric return f.takeError(); 15729dba64beSDimitry Andric function = std::move(f.get()); 15739dba64beSDimitry Andric 15749dba64beSDimitry Andric return Error::success(); 1575*0b57cec5SDimitry Andric } 1576*0b57cec5SDimitry Andric 15779dba64beSDimitry Andric llvm::Expected<PythonObject> 15789dba64beSDimitry Andric python::runStringOneLine(const llvm::Twine &string, 15799dba64beSDimitry Andric const PythonDictionary &globals, 15809dba64beSDimitry Andric const PythonDictionary &locals) { 15819dba64beSDimitry Andric if (!globals.IsValid() || !locals.IsValid()) 15829dba64beSDimitry Andric return nullDeref(); 1583*0b57cec5SDimitry Andric 15849dba64beSDimitry Andric PyObject *code = 15859dba64beSDimitry Andric Py_CompileString(NullTerminated(string), "<string>", Py_eval_input); 15869dba64beSDimitry Andric if (!code) { 15879dba64beSDimitry Andric PyErr_Clear(); 15889dba64beSDimitry Andric code = 15899dba64beSDimitry Andric Py_CompileString(NullTerminated(string), "<string>", Py_single_input); 15909dba64beSDimitry Andric } 15919dba64beSDimitry Andric if (!code) 15929dba64beSDimitry Andric return exception(); 15939dba64beSDimitry Andric auto code_ref = Take<PythonObject>(code); 15949dba64beSDimitry Andric 15959dba64beSDimitry Andric #if PY_MAJOR_VERSION < 3 15969dba64beSDimitry Andric PyObject *result = 15979dba64beSDimitry Andric PyEval_EvalCode((PyCodeObject *)code, globals.get(), locals.get()); 15989dba64beSDimitry Andric #else 15999dba64beSDimitry Andric PyObject *result = PyEval_EvalCode(code, globals.get(), locals.get()); 16009dba64beSDimitry Andric #endif 16019dba64beSDimitry Andric 16029dba64beSDimitry Andric if (!result) 16039dba64beSDimitry Andric return exception(); 16049dba64beSDimitry Andric 16059dba64beSDimitry Andric return Take<PythonObject>(result); 16069dba64beSDimitry Andric } 16079dba64beSDimitry Andric 16089dba64beSDimitry Andric llvm::Expected<PythonObject> 16099dba64beSDimitry Andric python::runStringMultiLine(const llvm::Twine &string, 16109dba64beSDimitry Andric const PythonDictionary &globals, 16119dba64beSDimitry Andric const PythonDictionary &locals) { 16129dba64beSDimitry Andric if (!globals.IsValid() || !locals.IsValid()) 16139dba64beSDimitry Andric return nullDeref(); 16149dba64beSDimitry Andric PyObject *result = PyRun_String(NullTerminated(string), Py_file_input, 16159dba64beSDimitry Andric globals.get(), locals.get()); 16169dba64beSDimitry Andric if (!result) 16179dba64beSDimitry Andric return exception(); 16189dba64beSDimitry Andric return Take<PythonObject>(result); 1619*0b57cec5SDimitry Andric } 1620*0b57cec5SDimitry Andric 1621*0b57cec5SDimitry Andric #endif 1622