Commit 7d99b0f0 authored by Stefan Behnel's avatar Stefan Behnel Committed by GitHub

Avoid acquiring the GIL at the end of nogil functions (GH-3556)

Acquire the GIL in nogil functions only when strictly needed on function exit, e.g. for cleaning up temp variables from with-gil blocks or adding tracebacks.

Closes GH-3554.
parent 25b7d7e4
...@@ -2401,8 +2401,8 @@ class CCodeWriter(object): ...@@ -2401,8 +2401,8 @@ class CCodeWriter(object):
UtilityCode.load_cached("ForceInitThreads", "ModuleSetupCode.c")) UtilityCode.load_cached("ForceInitThreads", "ModuleSetupCode.c"))
self.putln('__Pyx_RefNannySetupContext(%s, %d);' % (name, acquire_gil and 1 or 0)) self.putln('__Pyx_RefNannySetupContext(%s, %d);' % (name, acquire_gil and 1 or 0))
def put_finish_refcount_context(self): def put_finish_refcount_context(self, nogil=False):
self.putln("__Pyx_RefNannyFinishContext();") self.putln("__Pyx_RefNannyFinishContextNogil()" if nogil else "__Pyx_RefNannyFinishContext();")
def put_add_traceback(self, qualified_name, include_cline=True): def put_add_traceback(self, qualified_name, include_cline=True):
""" """
......
...@@ -1847,11 +1847,10 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -1847,11 +1847,10 @@ class FuncDefNode(StatNode, BlockNode):
use_refnanny = not lenv.nogil or lenv.has_with_gil_block use_refnanny = not lenv.nogil or lenv.has_with_gil_block
gilstate_decl = code.insertion_point()
if acquire_gil or acquire_gil_for_var_decls_only: if acquire_gil or acquire_gil_for_var_decls_only:
code.put_ensure_gil() code.put_ensure_gil()
code.funcstate.gil_owned = True code.funcstate.gil_owned = True
elif lenv.nogil and lenv.has_with_gil_block:
code.declare_gilstate()
if profile or linetrace: if profile or linetrace:
if not self.is_generator: if not self.is_generator:
...@@ -1974,6 +1973,19 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -1974,6 +1973,19 @@ class FuncDefNode(StatNode, BlockNode):
code.putln("") code.putln("")
code.putln("/* function exit code */") code.putln("/* function exit code */")
gil_owned = {
'success': code.funcstate.gil_owned,
'error': code.funcstate.gil_owned,
'gil_state_declared': False,
}
def assure_gil(code_path):
if not gil_owned[code_path]:
if not gil_owned['gil_state_declared']:
gilstate_decl.declare_gilstate()
gil_owned['gil_state_declared'] = True
code.put_ensure_gil(declare_gilstate=False)
gil_owned[code_path] = True
# ----- Default return value # ----- Default return value
return_type = self.return_type return_type = self.return_type
if not self.body.is_terminator: if not self.body.is_terminator:
...@@ -1982,6 +1994,7 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -1982,6 +1994,7 @@ class FuncDefNode(StatNode, BlockNode):
# lhs = "(PyObject *)%s" % Naming.retval_cname # lhs = "(PyObject *)%s" % Naming.retval_cname
#else: #else:
lhs = Naming.retval_cname lhs = Naming.retval_cname
assure_gil('success')
code.put_init_to_py_none(lhs, return_type) code.put_init_to_py_none(lhs, return_type)
elif not return_type.is_memoryviewslice: elif not return_type.is_memoryviewslice:
# memory view structs receive their default value on initialisation # memory view structs receive their default value on initialisation
...@@ -2006,6 +2019,7 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -2006,6 +2019,7 @@ class FuncDefNode(StatNode, BlockNode):
code.globalstate.use_utility_code(restore_exception_utility_code) code.globalstate.use_utility_code(restore_exception_utility_code)
code.putln("{ PyObject *__pyx_type, *__pyx_value, *__pyx_tb;") code.putln("{ PyObject *__pyx_type, *__pyx_value, *__pyx_tb;")
code.putln("__Pyx_PyThreadState_declare") code.putln("__Pyx_PyThreadState_declare")
assure_gil('error')
code.putln("__Pyx_PyThreadState_assign") code.putln("__Pyx_PyThreadState_assign")
code.putln("__Pyx_ErrFetch(&__pyx_type, &__pyx_value, &__pyx_tb);") code.putln("__Pyx_ErrFetch(&__pyx_type, &__pyx_value, &__pyx_tb);")
for entry in used_buffer_entries: for entry in used_buffer_entries:
...@@ -2026,20 +2040,14 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -2026,20 +2040,14 @@ class FuncDefNode(StatNode, BlockNode):
# code.globalstate.use_utility_code(get_exception_tuple_utility_code) # code.globalstate.use_utility_code(get_exception_tuple_utility_code)
# code.put_trace_exception() # code.put_trace_exception()
if lenv.nogil and not lenv.has_with_gil_block: assure_gil('error')
code.putln("{")
code.put_ensure_gil()
code.put_add_traceback(self.entry.qualified_name) code.put_add_traceback(self.entry.qualified_name)
if lenv.nogil and not lenv.has_with_gil_block:
code.put_release_ensured_gil()
code.putln("}")
else: else:
warning(self.entry.pos, warning(self.entry.pos,
"Unraisable exception in function '%s'." % "Unraisable exception in function '%s'." %
self.entry.qualified_name, 0) self.entry.qualified_name, 0)
code.put_unraisable(self.entry.qualified_name, lenv.nogil) assure_gil('error')
code.put_unraisable(self.entry.qualified_name)
default_retval = return_type.default_value default_retval = return_type.default_value
if err_val is None and default_retval: if err_val is None and default_retval:
err_val = default_retval err_val = default_retval
...@@ -2050,19 +2058,33 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -2050,19 +2058,33 @@ class FuncDefNode(StatNode, BlockNode):
code.putln("__Pyx_pretend_to_initialize(&%s);" % Naming.retval_cname) code.putln("__Pyx_pretend_to_initialize(&%s);" % Naming.retval_cname)
if is_getbuffer_slot: if is_getbuffer_slot:
assure_gil('error')
self.getbuffer_error_cleanup(code) self.getbuffer_error_cleanup(code)
# If we are using the non-error cleanup section we should # If we are using the non-error cleanup section we should
# jump past it if we have an error. The if-test below determine # jump past it if we have an error. The if-test below determine
# whether this section is used. # whether this section is used.
if buffers_present or is_getbuffer_slot or return_type.is_memoryviewslice: if buffers_present or is_getbuffer_slot or return_type.is_memoryviewslice:
# In the buffer cases, we already called assure_gil('error') and own the GIL.
assert gil_owned['error'] or return_type.is_memoryviewslice
code.put_goto(code.return_from_error_cleanup_label) code.put_goto(code.return_from_error_cleanup_label)
else:
# align error and success GIL state
if gil_owned['success']:
assure_gil('error')
elif gil_owned['error']:
code.put_release_ensured_gil()
gil_owned['error'] = False
# ----- Non-error return cleanup # ----- Non-error return cleanup
code.put_label(code.return_label) code.put_label(code.return_label)
assert gil_owned['error'] == gil_owned['success'], "%s != %s" % (gil_owned['error'], gil_owned['success'])
for entry in used_buffer_entries: for entry in used_buffer_entries:
assure_gil('success')
Buffer.put_release_buffer_code(code, entry) Buffer.put_release_buffer_code(code, entry)
if is_getbuffer_slot: if is_getbuffer_slot:
assure_gil('success')
self.getbuffer_normal_cleanup(code) self.getbuffer_normal_cleanup(code)
if return_type.is_memoryviewslice: if return_type.is_memoryviewslice:
...@@ -2072,16 +2094,21 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -2072,16 +2094,21 @@ class FuncDefNode(StatNode, BlockNode):
cond = code.unlikely(return_type.error_condition(Naming.retval_cname)) cond = code.unlikely(return_type.error_condition(Naming.retval_cname))
code.putln( code.putln(
'if (%s) {' % cond) 'if (%s) {' % cond)
if env.nogil: if not gil_owned['success']:
code.put_ensure_gil() code.put_ensure_gil()
code.putln( code.putln(
'PyErr_SetString(PyExc_TypeError, "Memoryview return value is not initialized");') 'PyErr_SetString(PyExc_TypeError, "Memoryview return value is not initialized");')
if env.nogil: if not gil_owned['success']:
code.put_release_ensured_gil() code.put_release_ensured_gil()
code.putln( code.putln(
'}') '}')
# ----- Return cleanup for both error and no-error return # ----- Return cleanup for both error and no-error return
if code.label_used(code.return_from_error_cleanup_label):
# If we came through the success path, then we took the same GIL decisions as for jumping here.
# If we came through the error path and did not jump, then we aligned both paths above.
# In the end, all paths are aligned from this point on.
assert gil_owned['error'] == gil_owned['success'], "%s != %s" % (gil_owned['error'], gil_owned['success'])
code.put_label(code.return_from_error_cleanup_label) code.put_label(code.return_from_error_cleanup_label)
for entry in lenv.var_entries: for entry in lenv.var_entries:
...@@ -2110,6 +2137,7 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -2110,6 +2137,7 @@ class FuncDefNode(StatNode, BlockNode):
# FIXME use entry.xdecref_cleanup - del arg seems to be the problem # FIXME use entry.xdecref_cleanup - del arg seems to be the problem
code.put_var_xdecref(entry, have_gil=not lenv.nogil) code.put_var_xdecref(entry, have_gil=not lenv.nogil)
if self.needs_closure: if self.needs_closure:
assure_gil('success')
code.put_decref(Naming.cur_scope_cname, lenv.scope_class.type) code.put_decref(Naming.cur_scope_cname, lenv.scope_class.type)
# ----- Return # ----- Return
...@@ -2124,6 +2152,7 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -2124,6 +2152,7 @@ class FuncDefNode(StatNode, BlockNode):
if self.entry.is_special and self.entry.name == "__hash__": if self.entry.is_special and self.entry.name == "__hash__":
# Returning -1 for __hash__ is supposed to signal an error # Returning -1 for __hash__ is supposed to signal an error
# We do as Python instances and coerce -1 into -2. # We do as Python instances and coerce -1 into -2.
assure_gil('success')
code.putln("if (unlikely(%s == -1) && !PyErr_Occurred()) %s = -2;" % ( code.putln("if (unlikely(%s == -1) && !PyErr_Occurred()) %s = -2;" % (
Naming.retval_cname, Naming.retval_cname)) Naming.retval_cname, Naming.retval_cname))
...@@ -2133,16 +2162,16 @@ class FuncDefNode(StatNode, BlockNode): ...@@ -2133,16 +2162,16 @@ class FuncDefNode(StatNode, BlockNode):
# generators are traced when iterated, not at creation # generators are traced when iterated, not at creation
if return_type.is_pyobject: if return_type.is_pyobject:
code.put_trace_return( code.put_trace_return(
Naming.retval_cname, nogil=not code.funcstate.gil_owned) Naming.retval_cname, nogil=not gil_owned['success'])
else: else:
code.put_trace_return( code.put_trace_return(
"Py_None", nogil=not code.funcstate.gil_owned) "Py_None", nogil=not gil_owned['success'])
if not lenv.nogil: if not lenv.nogil:
# GIL holding function # GIL holding function
code.put_finish_refcount_context() code.put_finish_refcount_context(nogil=not gil_owned['success'])
if acquire_gil or (lenv.nogil and lenv.has_with_gil_block): if acquire_gil or (lenv.nogil and gil_owned['success']):
# release the GIL (note that with-gil blocks acquire it on exit in their EnsureGILNode) # release the GIL (note that with-gil blocks acquire it on exit in their EnsureGILNode)
code.put_release_ensured_gil() code.put_release_ensured_gil()
code.funcstate.gil_owned = False code.funcstate.gil_owned = False
......
...@@ -1870,19 +1870,6 @@ if VALUE is not None: ...@@ -1870,19 +1870,6 @@ if VALUE is not None:
return node return node
def _handle_nogil_cleanup(self, lenv, node):
"Handle cleanup for 'with gil' blocks in nogil functions."
if lenv.nogil and lenv.has_with_gil_block:
# Acquire the GIL for cleanup in 'nogil' functions, by wrapping
# the entire function body in try/finally.
# The corresponding release will be taken care of by
# Nodes.FuncDefNode.generate_function_definitions()
node.body = Nodes.NogilTryFinallyStatNode(
node.body.pos,
body=node.body,
finally_clause=Nodes.EnsureGILNode(node.body.pos),
finally_except_clause=Nodes.EnsureGILNode(node.body.pos))
def _handle_fused(self, node): def _handle_fused(self, node):
if node.is_generator and node.has_fused_arguments: if node.is_generator and node.has_fused_arguments:
node.has_fused_arguments = False node.has_fused_arguments = False
...@@ -1925,7 +1912,6 @@ if VALUE is not None: ...@@ -1925,7 +1912,6 @@ if VALUE is not None:
node = self._create_fused_function(env, node) node = self._create_fused_function(env, node)
else: else:
node.body.analyse_declarations(lenv) node.body.analyse_declarations(lenv)
self._handle_nogil_cleanup(lenv, node)
self._super_visit_FuncDefNode(node) self._super_visit_FuncDefNode(node)
self.seen_vars_stack.pop() self.seen_vars_stack.pop()
......
...@@ -1374,6 +1374,11 @@ static CYTHON_INLINE int __Pyx_Is_Little_Endian(void) ...@@ -1374,6 +1374,11 @@ static CYTHON_INLINE int __Pyx_Is_Little_Endian(void)
#define __Pyx_RefNannySetupContext(name, acquire_gil) \ #define __Pyx_RefNannySetupContext(name, acquire_gil) \
__pyx_refnanny = __Pyx_RefNanny->SetupContext((name), __LINE__, __FILE__) __pyx_refnanny = __Pyx_RefNanny->SetupContext((name), __LINE__, __FILE__)
#endif #endif
#define __Pyx_RefNannyFinishContextNogil() { \
PyGILState_STATE __pyx_gilstate_save = PyGILState_Ensure(); \
__Pyx_RefNannyFinishContext(); \
PyGILState_Release(__pyx_gilstate_save); \
}
#define __Pyx_RefNannyFinishContext() \ #define __Pyx_RefNannyFinishContext() \
__Pyx_RefNanny->FinishContext(&__pyx_refnanny) __Pyx_RefNanny->FinishContext(&__pyx_refnanny)
#define __Pyx_INCREF(r) __Pyx_RefNanny->INCREF(__pyx_refnanny, (PyObject *)(r), __LINE__) #define __Pyx_INCREF(r) __Pyx_RefNanny->INCREF(__pyx_refnanny, (PyObject *)(r), __LINE__)
...@@ -1387,6 +1392,7 @@ static CYTHON_INLINE int __Pyx_Is_Little_Endian(void) ...@@ -1387,6 +1392,7 @@ static CYTHON_INLINE int __Pyx_Is_Little_Endian(void)
#else #else
#define __Pyx_RefNannyDeclarations #define __Pyx_RefNannyDeclarations
#define __Pyx_RefNannySetupContext(name, acquire_gil) #define __Pyx_RefNannySetupContext(name, acquire_gil)
#define __Pyx_RefNannyFinishContextNogil()
#define __Pyx_RefNannyFinishContext() #define __Pyx_RefNannyFinishContext()
#define __Pyx_INCREF(r) Py_INCREF(r) #define __Pyx_INCREF(r) Py_INCREF(r)
#define __Pyx_DECREF(r) Py_DECREF(r) #define __Pyx_DECREF(r) Py_DECREF(r)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment