Permalink
Cannot retrieve contributors at this time
1207 lines (1065 sloc)
34.7 KB
| /* Traceback implementation */ | |
| #include "Python.h" | |
| #include "code.h" // PyCode_Addr2Line etc | |
| #include "frameobject.h" // PyFrame_GetBack() | |
| #include "pycore_ast.h" // asdl_seq_* | |
| #include "pycore_compile.h" // _PyAST_Optimize | |
| #include "pycore_fileutils.h" // _Py_BEGIN_SUPPRESS_IPH | |
| #include "pycore_frame.h" // _PyFrame_GetCode() | |
| #include "pycore_interp.h" // PyInterpreterState.gc | |
| #include "pycore_parser.h" // _PyParser_ASTFromString | |
| #include "pycore_pyarena.h" // _PyArena_Free() | |
| #include "pycore_pyerrors.h" // _PyErr_Fetch() | |
| #include "pycore_pystate.h" // _PyThreadState_GET() | |
| #include "../Parser/pegen.h" // _PyPegen_byte_offset_to_character_offset() | |
| #include "structmember.h" // PyMemberDef | |
| #include "osdefs.h" // SEP | |
| #ifdef HAVE_FCNTL_H | |
| # include <fcntl.h> | |
| #endif | |
| #define OFF(x) offsetof(PyTracebackObject, x) | |
| #define PUTS(fd, str) _Py_write_noraise(fd, str, (int)strlen(str)) | |
| #define MAX_STRING_LENGTH 500 | |
| #define MAX_FRAME_DEPTH 100 | |
| #define MAX_NTHREADS 100 | |
| /* Function from Parser/tokenizer.c */ | |
| extern char* _PyTokenizer_FindEncodingFilename(int, PyObject *); | |
| _Py_IDENTIFIER(TextIOWrapper); | |
| _Py_IDENTIFIER(close); | |
| _Py_IDENTIFIER(open); | |
| _Py_IDENTIFIER(path); | |
| /*[clinic input] | |
| class TracebackType "PyTracebackObject *" "&PyTraceback_Type" | |
| [clinic start generated code]*/ | |
| /*[clinic end generated code: output=da39a3ee5e6b4b0d input=928fa06c10151120]*/ | |
| #include "clinic/traceback.c.h" | |
| static PyObject * | |
| tb_create_raw(PyTracebackObject *next, PyFrameObject *frame, int lasti, | |
| int lineno) | |
| { | |
| PyTracebackObject *tb; | |
| if ((next != NULL && !PyTraceBack_Check(next)) || | |
| frame == NULL || !PyFrame_Check(frame)) { | |
| PyErr_BadInternalCall(); | |
| return NULL; | |
| } | |
| tb = PyObject_GC_New(PyTracebackObject, &PyTraceBack_Type); | |
| if (tb != NULL) { | |
| Py_XINCREF(next); | |
| tb->tb_next = next; | |
| Py_XINCREF(frame); | |
| tb->tb_frame = frame; | |
| tb->tb_lasti = lasti; | |
| tb->tb_lineno = lineno; | |
| PyObject_GC_Track(tb); | |
| } | |
| return (PyObject *)tb; | |
| } | |
| /*[clinic input] | |
| @classmethod | |
| TracebackType.__new__ as tb_new | |
| tb_next: object | |
| tb_frame: object(type='PyFrameObject *', subclass_of='&PyFrame_Type') | |
| tb_lasti: int | |
| tb_lineno: int | |
| Create a new traceback object. | |
| [clinic start generated code]*/ | |
| static PyObject * | |
| tb_new_impl(PyTypeObject *type, PyObject *tb_next, PyFrameObject *tb_frame, | |
| int tb_lasti, int tb_lineno) | |
| /*[clinic end generated code: output=fa077debd72d861a input=01cbe8ec8783fca7]*/ | |
| { | |
| if (tb_next == Py_None) { | |
| tb_next = NULL; | |
| } else if (!PyTraceBack_Check(tb_next)) { | |
| return PyErr_Format(PyExc_TypeError, | |
| "expected traceback object or None, got '%s'", | |
| Py_TYPE(tb_next)->tp_name); | |
| } | |
| return tb_create_raw((PyTracebackObject *)tb_next, tb_frame, tb_lasti, | |
| tb_lineno); | |
| } | |
| static PyObject * | |
| tb_dir(PyTracebackObject *self, PyObject *Py_UNUSED(ignored)) | |
| { | |
| return Py_BuildValue("[ssss]", "tb_frame", "tb_next", | |
| "tb_lasti", "tb_lineno"); | |
| } | |
| static PyObject * | |
| tb_next_get(PyTracebackObject *self, void *Py_UNUSED(_)) | |
| { | |
| PyObject* ret = (PyObject*)self->tb_next; | |
| if (!ret) { | |
| ret = Py_None; | |
| } | |
| Py_INCREF(ret); | |
| return ret; | |
| } | |
| static int | |
| tb_next_set(PyTracebackObject *self, PyObject *new_next, void *Py_UNUSED(_)) | |
| { | |
| if (!new_next) { | |
| PyErr_Format(PyExc_TypeError, "can't delete tb_next attribute"); | |
| return -1; | |
| } | |
| /* We accept None or a traceback object, and map None -> NULL (inverse of | |
| tb_next_get) */ | |
| if (new_next == Py_None) { | |
| new_next = NULL; | |
| } else if (!PyTraceBack_Check(new_next)) { | |
| PyErr_Format(PyExc_TypeError, | |
| "expected traceback object, got '%s'", | |
| Py_TYPE(new_next)->tp_name); | |
| return -1; | |
| } | |
| /* Check for loops */ | |
| PyTracebackObject *cursor = (PyTracebackObject *)new_next; | |
| while (cursor) { | |
| if (cursor == self) { | |
| PyErr_Format(PyExc_ValueError, "traceback loop detected"); | |
| return -1; | |
| } | |
| cursor = cursor->tb_next; | |
| } | |
| PyObject *old_next = (PyObject*)self->tb_next; | |
| Py_XINCREF(new_next); | |
| self->tb_next = (PyTracebackObject *)new_next; | |
| Py_XDECREF(old_next); | |
| return 0; | |
| } | |
| static PyMethodDef tb_methods[] = { | |
| {"__dir__", (PyCFunction)tb_dir, METH_NOARGS}, | |
| {NULL, NULL, 0, NULL}, | |
| }; | |
| static PyMemberDef tb_memberlist[] = { | |
| {"tb_frame", T_OBJECT, OFF(tb_frame), READONLY|PY_AUDIT_READ}, | |
| {"tb_lasti", T_INT, OFF(tb_lasti), READONLY}, | |
| {"tb_lineno", T_INT, OFF(tb_lineno), READONLY}, | |
| {NULL} /* Sentinel */ | |
| }; | |
| static PyGetSetDef tb_getsetters[] = { | |
| {"tb_next", (getter)tb_next_get, (setter)tb_next_set, NULL, NULL}, | |
| {NULL} /* Sentinel */ | |
| }; | |
| static void | |
| tb_dealloc(PyTracebackObject *tb) | |
| { | |
| PyObject_GC_UnTrack(tb); | |
| Py_TRASHCAN_BEGIN(tb, tb_dealloc) | |
| Py_XDECREF(tb->tb_next); | |
| Py_XDECREF(tb->tb_frame); | |
| PyObject_GC_Del(tb); | |
| Py_TRASHCAN_END | |
| } | |
| static int | |
| tb_traverse(PyTracebackObject *tb, visitproc visit, void *arg) | |
| { | |
| Py_VISIT(tb->tb_next); | |
| Py_VISIT(tb->tb_frame); | |
| return 0; | |
| } | |
| static int | |
| tb_clear(PyTracebackObject *tb) | |
| { | |
| Py_CLEAR(tb->tb_next); | |
| Py_CLEAR(tb->tb_frame); | |
| return 0; | |
| } | |
| PyTypeObject PyTraceBack_Type = { | |
| PyVarObject_HEAD_INIT(&PyType_Type, 0) | |
| "traceback", | |
| sizeof(PyTracebackObject), | |
| 0, | |
| (destructor)tb_dealloc, /*tp_dealloc*/ | |
| 0, /*tp_vectorcall_offset*/ | |
| 0, /*tp_getattr*/ | |
| 0, /*tp_setattr*/ | |
| 0, /*tp_as_async*/ | |
| 0, /*tp_repr*/ | |
| 0, /*tp_as_number*/ | |
| 0, /*tp_as_sequence*/ | |
| 0, /*tp_as_mapping*/ | |
| 0, /* tp_hash */ | |
| 0, /* tp_call */ | |
| 0, /* tp_str */ | |
| PyObject_GenericGetAttr, /* tp_getattro */ | |
| 0, /* tp_setattro */ | |
| 0, /* tp_as_buffer */ | |
| Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */ | |
| tb_new__doc__, /* tp_doc */ | |
| (traverseproc)tb_traverse, /* tp_traverse */ | |
| (inquiry)tb_clear, /* tp_clear */ | |
| 0, /* tp_richcompare */ | |
| 0, /* tp_weaklistoffset */ | |
| 0, /* tp_iter */ | |
| 0, /* tp_iternext */ | |
| tb_methods, /* tp_methods */ | |
| tb_memberlist, /* tp_members */ | |
| tb_getsetters, /* tp_getset */ | |
| 0, /* tp_base */ | |
| 0, /* tp_dict */ | |
| 0, /* tp_descr_get */ | |
| 0, /* tp_descr_set */ | |
| 0, /* tp_dictoffset */ | |
| 0, /* tp_init */ | |
| 0, /* tp_alloc */ | |
| tb_new, /* tp_new */ | |
| }; | |
| PyObject* | |
| _PyTraceBack_FromFrame(PyObject *tb_next, PyFrameObject *frame) | |
| { | |
| assert(tb_next == NULL || PyTraceBack_Check(tb_next)); | |
| assert(frame != NULL); | |
| return tb_create_raw((PyTracebackObject *)tb_next, frame, frame->f_frame->f_lasti*sizeof(_Py_CODEUNIT), | |
| PyFrame_GetLineNumber(frame)); | |
| } | |
| int | |
| PyTraceBack_Here(PyFrameObject *frame) | |
| { | |
| PyObject *exc, *val, *tb, *newtb; | |
| PyErr_Fetch(&exc, &val, &tb); | |
| newtb = _PyTraceBack_FromFrame(tb, frame); | |
| if (newtb == NULL) { | |
| _PyErr_ChainExceptions(exc, val, tb); | |
| return -1; | |
| } | |
| PyErr_Restore(exc, val, newtb); | |
| Py_XDECREF(tb); | |
| return 0; | |
| } | |
| /* Insert a frame into the traceback for (funcname, filename, lineno). */ | |
| void _PyTraceback_Add(const char *funcname, const char *filename, int lineno) | |
| { | |
| PyObject *globals; | |
| PyCodeObject *code; | |
| PyFrameObject *frame; | |
| PyObject *exc, *val, *tb; | |
| PyThreadState *tstate = _PyThreadState_GET(); | |
| /* Save and clear the current exception. Python functions must not be | |
| called with an exception set. Calling Python functions happens when | |
| the codec of the filesystem encoding is implemented in pure Python. */ | |
| _PyErr_Fetch(tstate, &exc, &val, &tb); | |
| globals = PyDict_New(); | |
| if (!globals) | |
| goto error; | |
| code = PyCode_NewEmpty(filename, funcname, lineno); | |
| if (!code) { | |
| Py_DECREF(globals); | |
| goto error; | |
| } | |
| frame = PyFrame_New(tstate, code, globals, NULL); | |
| Py_DECREF(globals); | |
| Py_DECREF(code); | |
| if (!frame) | |
| goto error; | |
| frame->f_lineno = lineno; | |
| _PyErr_Restore(tstate, exc, val, tb); | |
| PyTraceBack_Here(frame); | |
| Py_DECREF(frame); | |
| return; | |
| error: | |
| _PyErr_ChainExceptions(exc, val, tb); | |
| } | |
| static PyObject * | |
| _Py_FindSourceFile(PyObject *filename, char* namebuf, size_t namelen, PyObject *io) | |
| { | |
| Py_ssize_t i; | |
| PyObject *binary; | |
| PyObject *v; | |
| Py_ssize_t npath; | |
| size_t taillen; | |
| PyObject *syspath; | |
| PyObject *path; | |
| const char* tail; | |
| PyObject *filebytes; | |
| const char* filepath; | |
| Py_ssize_t len; | |
| PyObject* result; | |
| filebytes = PyUnicode_EncodeFSDefault(filename); | |
| if (filebytes == NULL) { | |
| PyErr_Clear(); | |
| return NULL; | |
| } | |
| filepath = PyBytes_AS_STRING(filebytes); | |
| /* Search tail of filename in sys.path before giving up */ | |
| tail = strrchr(filepath, SEP); | |
| if (tail == NULL) | |
| tail = filepath; | |
| else | |
| tail++; | |
| taillen = strlen(tail); | |
| syspath = _PySys_GetObjectId(&PyId_path); | |
| if (syspath == NULL || !PyList_Check(syspath)) | |
| goto error; | |
| npath = PyList_Size(syspath); | |
| for (i = 0; i < npath; i++) { | |
| v = PyList_GetItem(syspath, i); | |
| if (v == NULL) { | |
| PyErr_Clear(); | |
| break; | |
| } | |
| if (!PyUnicode_Check(v)) | |
| continue; | |
| path = PyUnicode_EncodeFSDefault(v); | |
| if (path == NULL) { | |
| PyErr_Clear(); | |
| continue; | |
| } | |
| len = PyBytes_GET_SIZE(path); | |
| if (len + 1 + (Py_ssize_t)taillen >= (Py_ssize_t)namelen - 1) { | |
| Py_DECREF(path); | |
| continue; /* Too long */ | |
| } | |
| strcpy(namebuf, PyBytes_AS_STRING(path)); | |
| Py_DECREF(path); | |
| if (strlen(namebuf) != (size_t)len) | |
| continue; /* v contains '\0' */ | |
| if (len > 0 && namebuf[len-1] != SEP) | |
| namebuf[len++] = SEP; | |
| strcpy(namebuf+len, tail); | |
| binary = _PyObject_CallMethodId(io, &PyId_open, "ss", namebuf, "rb"); | |
| if (binary != NULL) { | |
| result = binary; | |
| goto finally; | |
| } | |
| PyErr_Clear(); | |
| } | |
| goto error; | |
| error: | |
| result = NULL; | |
| finally: | |
| Py_DECREF(filebytes); | |
| return result; | |
| } | |
| int | |
| _Py_DisplaySourceLine(PyObject *f, PyObject *filename, int lineno, int indent, int *truncation, PyObject **line) | |
| { | |
| int err = 0; | |
| int fd; | |
| int i; | |
| char *found_encoding; | |
| const char *encoding; | |
| PyObject *io; | |
| PyObject *binary; | |
| PyObject *fob = NULL; | |
| PyObject *lineobj = NULL; | |
| PyObject *res; | |
| char buf[MAXPATHLEN+1]; | |
| int kind; | |
| const void *data; | |
| /* open the file */ | |
| if (filename == NULL) | |
| return 0; | |
| /* Do not attempt to open things like <string> or <stdin> */ | |
| assert(PyUnicode_Check(filename)); | |
| if (PyUnicode_READ_CHAR(filename, 0) == '<') { | |
| Py_ssize_t len = PyUnicode_GET_LENGTH(filename); | |
| if (len > 0 && PyUnicode_READ_CHAR(filename, len - 1) == '>') { | |
| return 0; | |
| } | |
| } | |
| io = PyImport_ImportModuleNoBlock("io"); | |
| if (io == NULL) | |
| return -1; | |
| binary = _PyObject_CallMethodId(io, &PyId_open, "Os", filename, "rb"); | |
| if (binary == NULL) { | |
| PyErr_Clear(); | |
| binary = _Py_FindSourceFile(filename, buf, sizeof(buf), io); | |
| if (binary == NULL) { | |
| Py_DECREF(io); | |
| return -1; | |
| } | |
| } | |
| /* use the right encoding to decode the file as unicode */ | |
| fd = PyObject_AsFileDescriptor(binary); | |
| if (fd < 0) { | |
| Py_DECREF(io); | |
| Py_DECREF(binary); | |
| return 0; | |
| } | |
| found_encoding = _PyTokenizer_FindEncodingFilename(fd, filename); | |
| if (found_encoding == NULL) | |
| PyErr_Clear(); | |
| encoding = (found_encoding != NULL) ? found_encoding : "utf-8"; | |
| /* Reset position */ | |
| if (lseek(fd, 0, SEEK_SET) == (off_t)-1) { | |
| Py_DECREF(io); | |
| Py_DECREF(binary); | |
| PyMem_Free(found_encoding); | |
| return 0; | |
| } | |
| fob = _PyObject_CallMethodId(io, &PyId_TextIOWrapper, "Os", binary, encoding); | |
| Py_DECREF(io); | |
| PyMem_Free(found_encoding); | |
| if (fob == NULL) { | |
| PyErr_Clear(); | |
| res = _PyObject_CallMethodIdNoArgs(binary, &PyId_close); | |
| Py_DECREF(binary); | |
| if (res) | |
| Py_DECREF(res); | |
| else | |
| PyErr_Clear(); | |
| return 0; | |
| } | |
| Py_DECREF(binary); | |
| /* get the line number lineno */ | |
| for (i = 0; i < lineno; i++) { | |
| Py_XDECREF(lineobj); | |
| lineobj = PyFile_GetLine(fob, -1); | |
| if (!lineobj) { | |
| PyErr_Clear(); | |
| err = -1; | |
| break; | |
| } | |
| } | |
| res = _PyObject_CallMethodIdNoArgs(fob, &PyId_close); | |
| if (res) | |
| Py_DECREF(res); | |
| else | |
| PyErr_Clear(); | |
| Py_DECREF(fob); | |
| if (!lineobj || !PyUnicode_Check(lineobj)) { | |
| Py_XDECREF(lineobj); | |
| return err; | |
| } | |
| if (line) { | |
| Py_INCREF(lineobj); | |
| *line = lineobj; | |
| } | |
| /* remove the indentation of the line */ | |
| kind = PyUnicode_KIND(lineobj); | |
| data = PyUnicode_DATA(lineobj); | |
| for (i=0; i < PyUnicode_GET_LENGTH(lineobj); i++) { | |
| Py_UCS4 ch = PyUnicode_READ(kind, data, i); | |
| if (ch != ' ' && ch != '\t' && ch != '\014') | |
| break; | |
| } | |
| if (i) { | |
| PyObject *truncated; | |
| truncated = PyUnicode_Substring(lineobj, i, PyUnicode_GET_LENGTH(lineobj)); | |
| if (truncated) { | |
| Py_DECREF(lineobj); | |
| lineobj = truncated; | |
| } else { | |
| PyErr_Clear(); | |
| } | |
| } | |
| if (truncation != NULL) { | |
| *truncation = i - indent; | |
| } | |
| /* Write some spaces before the line */ | |
| strcpy(buf, " "); | |
| assert (strlen(buf) == 10); | |
| while (indent > 0) { | |
| if (indent < 10) | |
| buf[indent] = '\0'; | |
| err = PyFile_WriteString(buf, f); | |
| if (err != 0) | |
| break; | |
| indent -= 10; | |
| } | |
| /* finally display the line */ | |
| if (err == 0) | |
| err = PyFile_WriteObject(lineobj, f, Py_PRINT_RAW); | |
| Py_DECREF(lineobj); | |
| if (err == 0) | |
| err = PyFile_WriteString("\n", f); | |
| return err; | |
| } | |
| /* AST based Traceback Specialization | |
| * | |
| * When displaying a new traceback line, for certain syntactical constructs | |
| * (e.g a subscript, an arithmetic operation) we try to create a representation | |
| * that separates the primary source of error from the rest. | |
| * | |
| * Example specialization of BinOp nodes: | |
| * Traceback (most recent call last): | |
| * File "/home/isidentical/cpython/cpython/t.py", line 10, in <module> | |
| * add_values(1, 2, 'x', 3, 4) | |
| * ^^^^^^^^^^^^^^^^^^^^^^^^^^^ | |
| * File "/home/isidentical/cpython/cpython/t.py", line 2, in add_values | |
| * return a + b + c + d + e | |
| * ~~~~~~^~~ | |
| * TypeError: 'NoneType' object is not subscriptable | |
| */ | |
| #define IS_WHITESPACE(c) (((c) == ' ') || ((c) == '\t') || ((c) == '\f')) | |
| static int | |
| extract_anchors_from_expr(const char *segment_str, expr_ty expr, Py_ssize_t *left_anchor, Py_ssize_t *right_anchor, | |
| char** primary_error_char, char** secondary_error_char) | |
| { | |
| switch (expr->kind) { | |
| case BinOp_kind: { | |
| expr_ty left = expr->v.BinOp.left; | |
| expr_ty right = expr->v.BinOp.right; | |
| for (int i = left->end_col_offset; i < right->col_offset; i++) { | |
| if (IS_WHITESPACE(segment_str[i])) { | |
| continue; | |
| } | |
| *left_anchor = i; | |
| *right_anchor = i + 1; | |
| // Check whether if this a two-character operator (e.g //) | |
| if (i + 1 < right->col_offset && !IS_WHITESPACE(segment_str[i + 1])) { | |
| ++*right_anchor; | |
| } | |
| // Set the error characters | |
| *primary_error_char = "~"; | |
| *secondary_error_char = "^"; | |
| break; | |
| } | |
| return 1; | |
| } | |
| case Subscript_kind: { | |
| *left_anchor = expr->v.Subscript.value->end_col_offset; | |
| *right_anchor = expr->v.Subscript.slice->end_col_offset + 1; | |
| // Set the error characters | |
| *primary_error_char = "~"; | |
| *secondary_error_char = "^"; | |
| return 1; | |
| } | |
| default: | |
| return 0; | |
| } | |
| } | |
| static int | |
| extract_anchors_from_stmt(const char *segment_str, stmt_ty statement, Py_ssize_t *left_anchor, Py_ssize_t *right_anchor, | |
| char** primary_error_char, char** secondary_error_char) | |
| { | |
| switch (statement->kind) { | |
| case Expr_kind: { | |
| return extract_anchors_from_expr(segment_str, statement->v.Expr.value, left_anchor, right_anchor, | |
| primary_error_char, secondary_error_char); | |
| } | |
| default: | |
| return 0; | |
| } | |
| } | |
| static int | |
| extract_anchors_from_line(PyObject *filename, PyObject *line, | |
| Py_ssize_t start_offset, Py_ssize_t end_offset, | |
| Py_ssize_t *left_anchor, Py_ssize_t *right_anchor, | |
| char** primary_error_char, char** secondary_error_char) | |
| { | |
| int res = -1; | |
| PyArena *arena = NULL; | |
| PyObject *segment = PyUnicode_Substring(line, start_offset, end_offset); | |
| if (!segment) { | |
| goto done; | |
| } | |
| const char *segment_str = PyUnicode_AsUTF8(segment); | |
| if (!segment_str) { | |
| goto done; | |
| } | |
| arena = _PyArena_New(); | |
| if (!arena) { | |
| goto done; | |
| } | |
| PyCompilerFlags flags = _PyCompilerFlags_INIT; | |
| _PyASTOptimizeState state; | |
| state.optimize = _Py_GetConfig()->optimization_level; | |
| state.ff_features = 0; | |
| mod_ty module = _PyParser_ASTFromString(segment_str, filename, Py_file_input, | |
| &flags, arena); | |
| if (!module) { | |
| goto done; | |
| } | |
| if (!_PyAST_Optimize(module, arena, &state)) { | |
| goto done; | |
| } | |
| assert(module->kind == Module_kind); | |
| if (asdl_seq_LEN(module->v.Module.body) == 1) { | |
| stmt_ty statement = asdl_seq_GET(module->v.Module.body, 0); | |
| res = extract_anchors_from_stmt(segment_str, statement, left_anchor, right_anchor, | |
| primary_error_char, secondary_error_char); | |
| } else { | |
| res = 0; | |
| } | |
| done: | |
| if (res > 0) { | |
| *left_anchor += start_offset; | |
| *right_anchor += start_offset; | |
| } | |
| Py_XDECREF(segment); | |
| if (arena) { | |
| _PyArena_Free(arena); | |
| } | |
| return res; | |
| } | |
| #define _TRACEBACK_SOURCE_LINE_INDENT 4 | |
| static inline int | |
| ignore_source_errors(void) { | |
| if (PyErr_Occurred()) { | |
| if (PyErr_ExceptionMatches(PyExc_KeyboardInterrupt)) { | |
| return -1; | |
| } | |
| PyErr_Clear(); | |
| } | |
| return 0; | |
| } | |
| static inline int | |
| print_error_location_carets(PyObject *f, int offset, Py_ssize_t start_offset, Py_ssize_t end_offset, | |
| Py_ssize_t right_start_offset, Py_ssize_t left_end_offset, | |
| const char *primary, const char *secondary) { | |
| int err = 0; | |
| int special_chars = (left_end_offset != -1 || right_start_offset != -1); | |
| while (++offset <= end_offset) { | |
| if (offset <= start_offset || offset > end_offset) { | |
| err = PyFile_WriteString(" ", f); | |
| } else if (special_chars && left_end_offset < offset && offset <= right_start_offset) { | |
| err = PyFile_WriteString(secondary, f); | |
| } else { | |
| err = PyFile_WriteString(primary, f); | |
| } | |
| } | |
| err = PyFile_WriteString("\n", f); | |
| return err; | |
| } | |
| static int | |
| tb_displayline(PyTracebackObject* tb, PyObject *f, PyObject *filename, int lineno, | |
| PyFrameObject *frame, PyObject *name) | |
| { | |
| int err; | |
| PyObject *line; | |
| if (filename == NULL || name == NULL) | |
| return -1; | |
| line = PyUnicode_FromFormat(" File \"%U\", line %d, in %U\n", | |
| filename, lineno, name); | |
| if (line == NULL) | |
| return -1; | |
| err = PyFile_WriteObject(line, f, Py_PRINT_RAW); | |
| Py_DECREF(line); | |
| if (err != 0) | |
| return err; | |
| int truncation = _TRACEBACK_SOURCE_LINE_INDENT; | |
| PyObject* source_line = NULL; | |
| if (_Py_DisplaySourceLine(f, filename, lineno, _TRACEBACK_SOURCE_LINE_INDENT, | |
| &truncation, &source_line) != 0 || !source_line) { | |
| /* ignore errors since we can't report them, can we? */ | |
| err = ignore_source_errors(); | |
| goto done; | |
| } | |
| int code_offset = tb->tb_lasti; | |
| PyCodeObject* code = frame->f_frame->f_code; | |
| int start_line; | |
| int end_line; | |
| int start_col_byte_offset; | |
| int end_col_byte_offset; | |
| if (!PyCode_Addr2Location(code, code_offset, &start_line, &start_col_byte_offset, | |
| &end_line, &end_col_byte_offset)) { | |
| goto done; | |
| } | |
| if (start_line < 0 || end_line < 0 | |
| || start_col_byte_offset < 0 | |
| || end_col_byte_offset < 0) | |
| { | |
| goto done; | |
| } | |
| // When displaying errors, we will use the following generic structure: | |
| // | |
| // ERROR LINE ERROR LINE ERROR LINE ERROR LINE ERROR LINE ERROR LINE ERROR LINE | |
| // ~~~~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^^^^^~~~~~~~~~~~~~~~~~~~ | |
| // | |-> left_end_offset | |-> left_offset | |
| // |-> start_offset |-> right_start_offset | |
| // | |
| // In general we will only have (start_offset, end_offset) but we can gather more information | |
| // by analyzing the AST of the text between *start_offset* and *end_offset*. If this succeeds | |
| // we could get *left_end_offset* and *right_start_offset* and some selection of characters for | |
| // the different ranges (primary_error_char and secondary_error_char). If we cannot obtain the | |
| // AST information or we cannot identify special ranges within it, then left_end_offset and | |
| // right_end_offset will be set to -1. | |
| // Convert the utf-8 byte offset to the actual character offset so we print the right number of carets. | |
| assert(source_line); | |
| Py_ssize_t start_offset = _PyPegen_byte_offset_to_character_offset(source_line, start_col_byte_offset); | |
| if (start_offset < 0) { | |
| err = ignore_source_errors() < 0; | |
| goto done; | |
| } | |
| Py_ssize_t end_offset = _PyPegen_byte_offset_to_character_offset(source_line, end_col_byte_offset); | |
| if (end_offset < 0) { | |
| err = ignore_source_errors() < 0; | |
| goto done; | |
| } | |
| Py_ssize_t left_end_offset = -1; | |
| Py_ssize_t right_start_offset = -1; | |
| char *primary_error_char = "^"; | |
| char *secondary_error_char = primary_error_char; | |
| if (start_line == end_line) { | |
| int res = extract_anchors_from_line(filename, source_line, start_offset, end_offset, | |
| &left_end_offset, &right_start_offset, | |
| &primary_error_char, &secondary_error_char); | |
| if (res < 0 && ignore_source_errors() < 0) { | |
| goto done; | |
| } | |
| } | |
| else { | |
| // If this is a multi-line expression, then we will highlight until | |
| // the last non-whitespace character. | |
| const char *source_line_str = PyUnicode_AsUTF8(source_line); | |
| if (!source_line_str) { | |
| goto done; | |
| } | |
| Py_ssize_t i = PyUnicode_GET_LENGTH(source_line); | |
| while (--i >= 0) { | |
| if (!IS_WHITESPACE(source_line_str[i])) { | |
| break; | |
| } | |
| } | |
| end_offset = i + 1; | |
| } | |
| err = print_error_location_carets(f, truncation, start_offset, end_offset, | |
| right_start_offset, left_end_offset, | |
| primary_error_char, secondary_error_char); | |
| done: | |
| Py_XDECREF(source_line); | |
| return err; | |
| } | |
| static const int TB_RECURSIVE_CUTOFF = 3; // Also hardcoded in traceback.py. | |
| static int | |
| tb_print_line_repeated(PyObject *f, long cnt) | |
| { | |
| cnt -= TB_RECURSIVE_CUTOFF; | |
| PyObject *line = PyUnicode_FromFormat( | |
| (cnt > 1) | |
| ? " [Previous line repeated %ld more times]\n" | |
| : " [Previous line repeated %ld more time]\n", | |
| cnt); | |
| if (line == NULL) { | |
| return -1; | |
| } | |
| int err = PyFile_WriteObject(line, f, Py_PRINT_RAW); | |
| Py_DECREF(line); | |
| return err; | |
| } | |
| static int | |
| tb_printinternal(PyTracebackObject *tb, PyObject *f, long limit) | |
| { | |
| int err = 0; | |
| Py_ssize_t depth = 0; | |
| PyObject *last_file = NULL; | |
| int last_line = -1; | |
| PyObject *last_name = NULL; | |
| long cnt = 0; | |
| PyTracebackObject *tb1 = tb; | |
| while (tb1 != NULL) { | |
| depth++; | |
| tb1 = tb1->tb_next; | |
| } | |
| while (tb != NULL && depth > limit) { | |
| depth--; | |
| tb = tb->tb_next; | |
| } | |
| while (tb != NULL && err == 0) { | |
| PyCodeObject *code = PyFrame_GetCode(tb->tb_frame); | |
| if (last_file == NULL || | |
| code->co_filename != last_file || | |
| last_line == -1 || tb->tb_lineno != last_line || | |
| last_name == NULL || code->co_name != last_name) { | |
| if (cnt > TB_RECURSIVE_CUTOFF) { | |
| err = tb_print_line_repeated(f, cnt); | |
| } | |
| last_file = code->co_filename; | |
| last_line = tb->tb_lineno; | |
| last_name = code->co_name; | |
| cnt = 0; | |
| } | |
| cnt++; | |
| if (err == 0 && cnt <= TB_RECURSIVE_CUTOFF) { | |
| err = tb_displayline(tb, f, code->co_filename, tb->tb_lineno, | |
| tb->tb_frame, code->co_name); | |
| if (err == 0) { | |
| err = PyErr_CheckSignals(); | |
| } | |
| } | |
| Py_DECREF(code); | |
| tb = tb->tb_next; | |
| } | |
| if (err == 0 && cnt > TB_RECURSIVE_CUTOFF) { | |
| err = tb_print_line_repeated(f, cnt); | |
| } | |
| return err; | |
| } | |
| #define PyTraceBack_LIMIT 1000 | |
| int | |
| PyTraceBack_Print(PyObject *v, PyObject *f) | |
| { | |
| int err; | |
| PyObject *limitv; | |
| long limit = PyTraceBack_LIMIT; | |
| if (v == NULL) | |
| return 0; | |
| if (!PyTraceBack_Check(v)) { | |
| PyErr_BadInternalCall(); | |
| return -1; | |
| } | |
| limitv = PySys_GetObject("tracebacklimit"); | |
| if (limitv && PyLong_Check(limitv)) { | |
| int overflow; | |
| limit = PyLong_AsLongAndOverflow(limitv, &overflow); | |
| if (overflow > 0) { | |
| limit = LONG_MAX; | |
| } | |
| else if (limit <= 0) { | |
| return 0; | |
| } | |
| } | |
| err = PyFile_WriteString("Traceback (most recent call last):\n", f); | |
| if (!err) | |
| err = tb_printinternal((PyTracebackObject *)v, f, limit); | |
| return err; | |
| } | |
| /* Format an integer in range [0; 0xffffffff] to decimal and write it | |
| into the file fd. | |
| This function is signal safe. */ | |
| void | |
| _Py_DumpDecimal(int fd, size_t value) | |
| { | |
| /* maximum number of characters required for output of %lld or %p. | |
| We need at most ceil(log10(256)*SIZEOF_LONG_LONG) digits, | |
| plus 1 for the null byte. 53/22 is an upper bound for log10(256). */ | |
| char buffer[1 + (sizeof(size_t)*53-1) / 22 + 1]; | |
| char *ptr, *end; | |
| end = &buffer[Py_ARRAY_LENGTH(buffer) - 1]; | |
| ptr = end; | |
| *ptr = '\0'; | |
| do { | |
| --ptr; | |
| assert(ptr >= buffer); | |
| *ptr = '0' + (value % 10); | |
| value /= 10; | |
| } while (value); | |
| _Py_write_noraise(fd, ptr, end - ptr); | |
| } | |
| /* Format an integer as hexadecimal with width digits into fd file descriptor. | |
| The function is signal safe. */ | |
| void | |
| _Py_DumpHexadecimal(int fd, uintptr_t value, Py_ssize_t width) | |
| { | |
| char buffer[sizeof(uintptr_t) * 2 + 1], *ptr, *end; | |
| const Py_ssize_t size = Py_ARRAY_LENGTH(buffer) - 1; | |
| if (width > size) | |
| width = size; | |
| /* it's ok if width is negative */ | |
| end = &buffer[size]; | |
| ptr = end; | |
| *ptr = '\0'; | |
| do { | |
| --ptr; | |
| assert(ptr >= buffer); | |
| *ptr = Py_hexdigits[value & 15]; | |
| value >>= 4; | |
| } while ((end - ptr) < width || value); | |
| _Py_write_noraise(fd, ptr, end - ptr); | |
| } | |
| void | |
| _Py_DumpASCII(int fd, PyObject *text) | |
| { | |
| PyASCIIObject *ascii = (PyASCIIObject *)text; | |
| Py_ssize_t i, size; | |
| int truncated; | |
| int kind; | |
| void *data = NULL; | |
| wchar_t *wstr = NULL; | |
| Py_UCS4 ch; | |
| if (!PyUnicode_Check(text)) | |
| return; | |
| size = ascii->length; | |
| kind = ascii->state.kind; | |
| if (kind == PyUnicode_WCHAR_KIND) { | |
| wstr = ((PyASCIIObject *)text)->wstr; | |
| if (wstr == NULL) | |
| return; | |
| size = ((PyCompactUnicodeObject *)text)->wstr_length; | |
| } | |
| else if (ascii->state.compact) { | |
| if (ascii->state.ascii) | |
| data = ((PyASCIIObject*)text) + 1; | |
| else | |
| data = ((PyCompactUnicodeObject*)text) + 1; | |
| } | |
| else { | |
| data = ((PyUnicodeObject *)text)->data.any; | |
| if (data == NULL) | |
| return; | |
| } | |
| if (MAX_STRING_LENGTH < size) { | |
| size = MAX_STRING_LENGTH; | |
| truncated = 1; | |
| } | |
| else { | |
| truncated = 0; | |
| } | |
| for (i=0; i < size; i++) { | |
| if (kind != PyUnicode_WCHAR_KIND) | |
| ch = PyUnicode_READ(kind, data, i); | |
| else | |
| ch = wstr[i]; | |
| if (' ' <= ch && ch <= 126) { | |
| /* printable ASCII character */ | |
| char c = (char)ch; | |
| _Py_write_noraise(fd, &c, 1); | |
| } | |
| else if (ch <= 0xff) { | |
| PUTS(fd, "\\x"); | |
| _Py_DumpHexadecimal(fd, ch, 2); | |
| } | |
| else if (ch <= 0xffff) { | |
| PUTS(fd, "\\u"); | |
| _Py_DumpHexadecimal(fd, ch, 4); | |
| } | |
| else { | |
| PUTS(fd, "\\U"); | |
| _Py_DumpHexadecimal(fd, ch, 8); | |
| } | |
| } | |
| if (truncated) { | |
| PUTS(fd, "..."); | |
| } | |
| } | |
| /* Write a frame into the file fd: "File "xxx", line xxx in xxx". | |
| This function is signal safe. */ | |
| static void | |
| dump_frame(int fd, InterpreterFrame *frame) | |
| { | |
| PyCodeObject *code = frame->f_code; | |
| PUTS(fd, " File "); | |
| if (code->co_filename != NULL | |
| && PyUnicode_Check(code->co_filename)) | |
| { | |
| PUTS(fd, "\""); | |
| _Py_DumpASCII(fd, code->co_filename); | |
| PUTS(fd, "\""); | |
| } else { | |
| PUTS(fd, "???"); | |
| } | |
| int lineno = PyCode_Addr2Line(code, frame->f_lasti*sizeof(_Py_CODEUNIT)); | |
| PUTS(fd, ", line "); | |
| if (lineno >= 0) { | |
| _Py_DumpDecimal(fd, (size_t)lineno); | |
| } | |
| else { | |
| PUTS(fd, "???"); | |
| } | |
| PUTS(fd, " in "); | |
| if (code->co_name != NULL | |
| && PyUnicode_Check(code->co_name)) { | |
| _Py_DumpASCII(fd, code->co_name); | |
| } | |
| else { | |
| PUTS(fd, "???"); | |
| } | |
| PUTS(fd, "\n"); | |
| } | |
| static void | |
| dump_traceback(int fd, PyThreadState *tstate, int write_header) | |
| { | |
| InterpreterFrame *frame; | |
| unsigned int depth; | |
| if (write_header) { | |
| PUTS(fd, "Stack (most recent call first):\n"); | |
| } | |
| frame = tstate->frame; | |
| if (frame == NULL) { | |
| PUTS(fd, " <no Python frame>\n"); | |
| return; | |
| } | |
| depth = 0; | |
| while (1) { | |
| if (MAX_FRAME_DEPTH <= depth) { | |
| PUTS(fd, " ...\n"); | |
| break; | |
| } | |
| dump_frame(fd, frame); | |
| frame = frame->previous; | |
| if (frame == NULL) { | |
| break; | |
| } | |
| depth++; | |
| } | |
| } | |
| /* Dump the traceback of a Python thread into fd. Use write() to write the | |
| traceback and retry if write() is interrupted by a signal (failed with | |
| EINTR), but don't call the Python signal handler. | |
| The caller is responsible to call PyErr_CheckSignals() to call Python signal | |
| handlers if signals were received. */ | |
| void | |
| _Py_DumpTraceback(int fd, PyThreadState *tstate) | |
| { | |
| dump_traceback(fd, tstate, 1); | |
| } | |
| /* Write the thread identifier into the file 'fd': "Current thread 0xHHHH:\" if | |
| is_current is true, "Thread 0xHHHH:\n" otherwise. | |
| This function is signal safe. */ | |
| static void | |
| write_thread_id(int fd, PyThreadState *tstate, int is_current) | |
| { | |
| if (is_current) | |
| PUTS(fd, "Current thread 0x"); | |
| else | |
| PUTS(fd, "Thread 0x"); | |
| _Py_DumpHexadecimal(fd, | |
| tstate->thread_id, | |
| sizeof(unsigned long) * 2); | |
| PUTS(fd, " (most recent call first):\n"); | |
| } | |
| /* Dump the traceback of all Python threads into fd. Use write() to write the | |
| traceback and retry if write() is interrupted by a signal (failed with | |
| EINTR), but don't call the Python signal handler. | |
| The caller is responsible to call PyErr_CheckSignals() to call Python signal | |
| handlers if signals were received. */ | |
| const char* | |
| _Py_DumpTracebackThreads(int fd, PyInterpreterState *interp, | |
| PyThreadState *current_tstate) | |
| { | |
| PyThreadState *tstate; | |
| unsigned int nthreads; | |
| if (current_tstate == NULL) { | |
| /* _Py_DumpTracebackThreads() is called from signal handlers by | |
| faulthandler. | |
| SIGSEGV, SIGFPE, SIGABRT, SIGBUS and SIGILL are synchronous signals | |
| and are thus delivered to the thread that caused the fault. Get the | |
| Python thread state of the current thread. | |
| PyThreadState_Get() doesn't give the state of the thread that caused | |
| the fault if the thread released the GIL, and so | |
| _PyThreadState_GET() cannot be used. Read the thread specific | |
| storage (TSS) instead: call PyGILState_GetThisThreadState(). */ | |
| current_tstate = PyGILState_GetThisThreadState(); | |
| } | |
| if (interp == NULL) { | |
| if (current_tstate == NULL) { | |
| interp = _PyGILState_GetInterpreterStateUnsafe(); | |
| if (interp == NULL) { | |
| /* We need the interpreter state to get Python threads */ | |
| return "unable to get the interpreter state"; | |
| } | |
| } | |
| else { | |
| interp = current_tstate->interp; | |
| } | |
| } | |
| assert(interp != NULL); | |
| /* Get the current interpreter from the current thread */ | |
| tstate = PyInterpreterState_ThreadHead(interp); | |
| if (tstate == NULL) | |
| return "unable to get the thread head state"; | |
| /* Dump the traceback of each thread */ | |
| tstate = PyInterpreterState_ThreadHead(interp); | |
| nthreads = 0; | |
| _Py_BEGIN_SUPPRESS_IPH | |
| do | |
| { | |
| if (nthreads != 0) | |
| PUTS(fd, "\n"); | |
| if (nthreads >= MAX_NTHREADS) { | |
| PUTS(fd, "...\n"); | |
| break; | |
| } | |
| write_thread_id(fd, tstate, tstate == current_tstate); | |
| if (tstate == current_tstate && tstate->interp->gc.collecting) { | |
| PUTS(fd, " Garbage-collecting\n"); | |
| } | |
| dump_traceback(fd, tstate, 0); | |
| tstate = PyThreadState_Next(tstate); | |
| nthreads++; | |
| } while (tstate != NULL); | |
| _Py_END_SUPPRESS_IPH | |
| return NULL; | |
| } | |