You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1315 lines
44 KiB
Python

# sql/lambdas.py
# Copyright (C) 2005-2022 the SQLAlchemy authors and contributors
# <see AUTHORS file>
#
# This module is part of SQLAlchemy and is released under
# the MIT License: https://www.opensource.org/licenses/mit-license.php
import inspect
import itertools
import operator
import sys
import threading
import types
import weakref
from . import coercions
from . import elements
from . import roles
from . import schema
from . import traversals
from . import type_api
from . import visitors
from .base import _clone
from .base import Options
from .operators import ColumnOperators
from .. import exc
from .. import inspection
from .. import util
from ..util import collections_abc
from ..util import compat
_closure_per_cache_key = util.LRUCache(1000)
class LambdaOptions(Options):
enable_tracking = True
track_closure_variables = True
track_on = None
global_track_bound_values = True
track_bound_values = True
lambda_cache = None
def lambda_stmt(
lmb,
enable_tracking=True,
track_closure_variables=True,
track_on=None,
global_track_bound_values=True,
track_bound_values=True,
lambda_cache=None,
):
"""Produce a SQL statement that is cached as a lambda.
The Python code object within the lambda is scanned for both Python
literals that will become bound parameters as well as closure variables
that refer to Core or ORM constructs that may vary. The lambda itself
will be invoked only once per particular set of constructs detected.
E.g.::
from sqlalchemy import lambda_stmt
stmt = lambda_stmt(lambda: table.select())
stmt += lambda s: s.where(table.c.id == 5)
result = connection.execute(stmt)
The object returned is an instance of :class:`_sql.StatementLambdaElement`.
.. versionadded:: 1.4
:param lmb: a Python function, typically a lambda, which takes no arguments
and returns a SQL expression construct
:param enable_tracking: when False, all scanning of the given lambda for
changes in closure variables or bound parameters is disabled. Use for
a lambda that produces the identical results in all cases with no
parameterization.
:param track_closure_variables: when False, changes in closure variables
within the lambda will not be scanned. Use for a lambda where the
state of its closure variables will never change the SQL structure
returned by the lambda.
:param track_bound_values: when False, bound parameter tracking will
be disabled for the given lambda. Use for a lambda that either does
not produce any bound values, or where the initial bound values never
change.
:param global_track_bound_values: when False, bound parameter tracking
will be disabled for the entire statement including additional links
added via the :meth:`_sql.StatementLambdaElement.add_criteria` method.
:param lambda_cache: a dictionary or other mapping-like object where
information about the lambda's Python code as well as the tracked closure
variables in the lambda itself will be stored. Defaults
to a global LRU cache. This cache is independent of the "compiled_cache"
used by the :class:`_engine.Connection` object.
.. seealso::
:ref:`engine_lambda_caching`
"""
return StatementLambdaElement(
lmb,
roles.StatementRole,
LambdaOptions(
enable_tracking=enable_tracking,
track_on=track_on,
track_closure_variables=track_closure_variables,
global_track_bound_values=global_track_bound_values,
track_bound_values=track_bound_values,
lambda_cache=lambda_cache,
),
)
class LambdaElement(elements.ClauseElement):
"""A SQL construct where the state is stored as an un-invoked lambda.
The :class:`_sql.LambdaElement` is produced transparently whenever
passing lambda expressions into SQL constructs, such as::
stmt = select(table).where(lambda: table.c.col == parameter)
The :class:`_sql.LambdaElement` is the base of the
:class:`_sql.StatementLambdaElement` which represents a full statement
within a lambda.
.. versionadded:: 1.4
.. seealso::
:ref:`engine_lambda_caching`
"""
__visit_name__ = "lambda_element"
_is_lambda_element = True
_traverse_internals = [
("_resolved", visitors.InternalTraversal.dp_clauseelement)
]
_transforms = ()
parent_lambda = None
def __repr__(self):
return "%s(%r)" % (self.__class__.__name__, self.fn.__code__)
def __init__(
self, fn, role, opts=LambdaOptions, apply_propagate_attrs=None
):
self.fn = fn
self.role = role
self.tracker_key = (fn.__code__,)
self.opts = opts
if apply_propagate_attrs is None and (role is roles.StatementRole):
apply_propagate_attrs = self
rec = self._retrieve_tracker_rec(fn, apply_propagate_attrs, opts)
if apply_propagate_attrs is not None:
propagate_attrs = rec.propagate_attrs
if propagate_attrs:
apply_propagate_attrs._propagate_attrs = propagate_attrs
def _retrieve_tracker_rec(self, fn, apply_propagate_attrs, opts):
lambda_cache = opts.lambda_cache
if lambda_cache is None:
lambda_cache = _closure_per_cache_key
tracker_key = self.tracker_key
fn = self.fn
closure = fn.__closure__
tracker = AnalyzedCode.get(
fn,
self,
opts,
)
self._resolved_bindparams = bindparams = []
if self.parent_lambda is not None:
parent_closure_cache_key = self.parent_lambda.closure_cache_key
else:
parent_closure_cache_key = ()
if parent_closure_cache_key is not traversals.NO_CACHE:
anon_map = traversals.anon_map()
cache_key = tuple(
[
getter(closure, opts, anon_map, bindparams)
for getter in tracker.closure_trackers
]
)
if traversals.NO_CACHE not in anon_map:
cache_key = parent_closure_cache_key + cache_key
self.closure_cache_key = cache_key
try:
rec = lambda_cache[tracker_key + cache_key]
except KeyError:
rec = None
else:
cache_key = traversals.NO_CACHE
rec = None
else:
cache_key = traversals.NO_CACHE
rec = None
self.closure_cache_key = cache_key
if rec is None:
if cache_key is not traversals.NO_CACHE:
with AnalyzedCode._generation_mutex:
key = tracker_key + cache_key
if key not in lambda_cache:
rec = AnalyzedFunction(
tracker, self, apply_propagate_attrs, fn
)
rec.closure_bindparams = bindparams
lambda_cache[key] = rec
else:
rec = lambda_cache[key]
else:
rec = NonAnalyzedFunction(self._invoke_user_fn(fn))
else:
bindparams[:] = [
orig_bind._with_value(new_bind.value, maintain_key=True)
for orig_bind, new_bind in zip(
rec.closure_bindparams, bindparams
)
]
self._rec = rec
if cache_key is not traversals.NO_CACHE:
if self.parent_lambda is not None:
bindparams[:0] = self.parent_lambda._resolved_bindparams
lambda_element = self
while lambda_element is not None:
rec = lambda_element._rec
if rec.bindparam_trackers:
tracker_instrumented_fn = rec.tracker_instrumented_fn
for tracker in rec.bindparam_trackers:
tracker(
lambda_element.fn,
tracker_instrumented_fn,
bindparams,
)
lambda_element = lambda_element.parent_lambda
return rec
def __getattr__(self, key):
return getattr(self._rec.expected_expr, key)
@property
def _is_sequence(self):
return self._rec.is_sequence
@property
def _select_iterable(self):
if self._is_sequence:
return itertools.chain.from_iterable(
[element._select_iterable for element in self._resolved]
)
else:
return self._resolved._select_iterable
@property
def _from_objects(self):
if self._is_sequence:
return itertools.chain.from_iterable(
[element._from_objects for element in self._resolved]
)
else:
return self._resolved._from_objects
def _param_dict(self):
return {b.key: b.value for b in self._resolved_bindparams}
def _setup_binds_for_tracked_expr(self, expr):
bindparam_lookup = {b.key: b for b in self._resolved_bindparams}
def replace(thing):
if isinstance(thing, elements.BindParameter):
if thing.key in bindparam_lookup:
bind = bindparam_lookup[thing.key]
if thing.expanding:
bind.expanding = True
bind.expand_op = thing.expand_op
bind.type = thing.type
return bind
if self._rec.is_sequence:
expr = [
visitors.replacement_traverse(sub_expr, {}, replace)
for sub_expr in expr
]
elif getattr(expr, "is_clause_element", False):
expr = visitors.replacement_traverse(expr, {}, replace)
return expr
def _copy_internals(
self, clone=_clone, deferred_copy_internals=None, **kw
):
# TODO: this needs A LOT of tests
self._resolved = clone(
self._resolved,
deferred_copy_internals=deferred_copy_internals,
**kw
)
@util.memoized_property
def _resolved(self):
expr = self._rec.expected_expr
if self._resolved_bindparams:
expr = self._setup_binds_for_tracked_expr(expr)
return expr
def _gen_cache_key(self, anon_map, bindparams):
if self.closure_cache_key is traversals.NO_CACHE:
anon_map[traversals.NO_CACHE] = True
return None
cache_key = (
self.fn.__code__,
self.__class__,
) + self.closure_cache_key
parent = self.parent_lambda
while parent is not None:
cache_key = (
(parent.fn.__code__,) + parent.closure_cache_key + cache_key
)
parent = parent.parent_lambda
if self._resolved_bindparams:
bindparams.extend(self._resolved_bindparams)
return cache_key
def _invoke_user_fn(self, fn, *arg):
return fn()
class DeferredLambdaElement(LambdaElement):
"""A LambdaElement where the lambda accepts arguments and is
invoked within the compile phase with special context.
This lambda doesn't normally produce its real SQL expression outside of the
compile phase. It is passed a fixed set of initial arguments
so that it can generate a sample expression.
"""
def __init__(self, fn, role, opts=LambdaOptions, lambda_args=()):
self.lambda_args = lambda_args
super(DeferredLambdaElement, self).__init__(fn, role, opts)
def _invoke_user_fn(self, fn, *arg):
return fn(*self.lambda_args)
def _resolve_with_args(self, *lambda_args):
tracker_fn = self._rec.tracker_instrumented_fn
expr = tracker_fn(*lambda_args)
expr = coercions.expect(self.role, expr)
expr = self._setup_binds_for_tracked_expr(expr)
# this validation is getting very close, but not quite, to achieving
# #5767. The problem is if the base lambda uses an unnamed column
# as is very common with mixins, the parameter name is different
# and it produces a false positive; that is, for the documented case
# that is exactly what people will be doing, it doesn't work, so
# I'm not really sure how to handle this right now.
# expected_binds = [
# b._orig_key
# for b in self._rec.expr._generate_cache_key()[1]
# if b.required
# ]
# got_binds = [
# b._orig_key for b in expr._generate_cache_key()[1] if b.required
# ]
# if expected_binds != got_binds:
# raise exc.InvalidRequestError(
# "Lambda callable at %s produced a different set of bound "
# "parameters than its original run: %s"
# % (self.fn.__code__, ", ".join(got_binds))
# )
# TODO: TEST TEST TEST, this is very out there
for deferred_copy_internals in self._transforms:
expr = deferred_copy_internals(expr)
return expr
def _copy_internals(
self, clone=_clone, deferred_copy_internals=None, **kw
):
super(DeferredLambdaElement, self)._copy_internals(
clone=clone,
deferred_copy_internals=deferred_copy_internals, # **kw
opts=kw,
)
# TODO: A LOT A LOT of tests. for _resolve_with_args, we don't know
# our expression yet. so hold onto the replacement
if deferred_copy_internals:
self._transforms += (deferred_copy_internals,)
class StatementLambdaElement(roles.AllowsLambdaRole, LambdaElement):
"""Represent a composable SQL statement as a :class:`_sql.LambdaElement`.
The :class:`_sql.StatementLambdaElement` is constructed using the
:func:`_sql.lambda_stmt` function::
from sqlalchemy import lambda_stmt
stmt = lambda_stmt(lambda: select(table))
Once constructed, additional criteria can be built onto the statement
by adding subsequent lambdas, which accept the existing statement
object as a single parameter::
stmt += lambda s: s.where(table.c.col == parameter)
.. versionadded:: 1.4
.. seealso::
:ref:`engine_lambda_caching`
"""
def __add__(self, other):
return self.add_criteria(other)
def add_criteria(
self,
other,
enable_tracking=True,
track_on=None,
track_closure_variables=True,
track_bound_values=True,
):
"""Add new criteria to this :class:`_sql.StatementLambdaElement`.
E.g.::
>>> def my_stmt(parameter):
... stmt = lambda_stmt(
... lambda: select(table.c.x, table.c.y),
... )
... stmt = stmt.add_criteria(
... lambda: table.c.x > parameter
... )
... return stmt
The :meth:`_sql.StatementLambdaElement.add_criteria` method is
equivalent to using the Python addition operator to add a new
lambda, except that additional arguments may be added including
``track_closure_values`` and ``track_on``::
>>> def my_stmt(self, foo):
... stmt = lambda_stmt(
... lambda: select(func.max(foo.x, foo.y)),
... track_closure_variables=False
... )
... stmt = stmt.add_criteria(
... lambda: self.where_criteria,
... track_on=[self]
... )
... return stmt
See :func:`_sql.lambda_stmt` for a description of the parameters
accepted.
"""
opts = self.opts + dict(
enable_tracking=enable_tracking,
track_closure_variables=track_closure_variables,
global_track_bound_values=self.opts.global_track_bound_values,
track_on=track_on,
track_bound_values=track_bound_values,
)
return LinkedLambdaElement(other, parent_lambda=self, opts=opts)
def _execute_on_connection(
self, connection, multiparams, params, execution_options
):
if self._rec.expected_expr.supports_execution:
return connection._execute_clauseelement(
self, multiparams, params, execution_options
)
else:
raise exc.ObjectNotExecutableError(self)
@property
def _with_options(self):
return self._rec.expected_expr._with_options
@property
def _effective_plugin_target(self):
return self._rec.expected_expr._effective_plugin_target
@property
def _execution_options(self):
return self._rec.expected_expr._execution_options
def spoil(self):
"""Return a new :class:`.StatementLambdaElement` that will run
all lambdas unconditionally each time.
"""
return NullLambdaStatement(self.fn())
class NullLambdaStatement(roles.AllowsLambdaRole, elements.ClauseElement):
"""Provides the :class:`.StatementLambdaElement` API but does not
cache or analyze lambdas.
the lambdas are instead invoked immediately.
The intended use is to isolate issues that may arise when using
lambda statements.
"""
__visit_name__ = "lambda_element"
_is_lambda_element = True
_traverse_internals = [
("_resolved", visitors.InternalTraversal.dp_clauseelement)
]
def __init__(self, statement):
self._resolved = statement
self._propagate_attrs = statement._propagate_attrs
def __getattr__(self, key):
return getattr(self._resolved, key)
def __add__(self, other):
statement = other(self._resolved)
return NullLambdaStatement(statement)
def add_criteria(self, other, **kw):
statement = other(self._resolved)
return NullLambdaStatement(statement)
def _execute_on_connection(
self, connection, multiparams, params, execution_options
):
if self._resolved.supports_execution:
return connection._execute_clauseelement(
self, multiparams, params, execution_options
)
else:
raise exc.ObjectNotExecutableError(self)
class LinkedLambdaElement(StatementLambdaElement):
"""Represent subsequent links of a :class:`.StatementLambdaElement`."""
role = None
def __init__(self, fn, parent_lambda, opts):
self.opts = opts
self.fn = fn
self.parent_lambda = parent_lambda
self.tracker_key = parent_lambda.tracker_key + (fn.__code__,)
self._retrieve_tracker_rec(fn, self, opts)
self._propagate_attrs = parent_lambda._propagate_attrs
def _invoke_user_fn(self, fn, *arg):
return fn(self.parent_lambda._resolved)
class AnalyzedCode(object):
__slots__ = (
"track_closure_variables",
"track_bound_values",
"bindparam_trackers",
"closure_trackers",
"build_py_wrappers",
)
_fns = weakref.WeakKeyDictionary()
_generation_mutex = threading.RLock()
@classmethod
def get(cls, fn, lambda_element, lambda_kw, **kw):
try:
# TODO: validate kw haven't changed?
return cls._fns[fn.__code__]
except KeyError:
pass
with cls._generation_mutex:
# check for other thread already created object
if fn.__code__ in cls._fns:
return cls._fns[fn.__code__]
cls._fns[fn.__code__] = analyzed = AnalyzedCode(
fn, lambda_element, lambda_kw, **kw
)
return analyzed
def __init__(self, fn, lambda_element, opts):
if inspect.ismethod(fn):
raise exc.ArgumentError(
"Method %s may not be passed as a SQL expression" % fn
)
closure = fn.__closure__
self.track_bound_values = (
opts.track_bound_values and opts.global_track_bound_values
)
enable_tracking = opts.enable_tracking
track_on = opts.track_on
track_closure_variables = opts.track_closure_variables
self.track_closure_variables = track_closure_variables and not track_on
# a list of callables generated from _bound_parameter_getter_*
# functions. Each of these uses a PyWrapper object to retrieve
# a parameter value
self.bindparam_trackers = []
# a list of callables generated from _cache_key_getter_* functions
# these callables work to generate a cache key for the lambda
# based on what's inside its closure variables.
self.closure_trackers = []
self.build_py_wrappers = []
if enable_tracking:
if track_on:
self._init_track_on(track_on)
self._init_globals(fn)
if closure:
self._init_closure(fn)
self._setup_additional_closure_trackers(fn, lambda_element, opts)
def _init_track_on(self, track_on):
self.closure_trackers.extend(
self._cache_key_getter_track_on(idx, elem)
for idx, elem in enumerate(track_on)
)
def _init_globals(self, fn):
build_py_wrappers = self.build_py_wrappers
bindparam_trackers = self.bindparam_trackers
track_bound_values = self.track_bound_values
for name in fn.__code__.co_names:
if name not in fn.__globals__:
continue
_bound_value = self._roll_down_to_literal(fn.__globals__[name])
if coercions._deep_is_literal(_bound_value):
build_py_wrappers.append((name, None))
if track_bound_values:
bindparam_trackers.append(
self._bound_parameter_getter_func_globals(name)
)
def _init_closure(self, fn):
build_py_wrappers = self.build_py_wrappers
closure = fn.__closure__
track_bound_values = self.track_bound_values
track_closure_variables = self.track_closure_variables
bindparam_trackers = self.bindparam_trackers
closure_trackers = self.closure_trackers
for closure_index, (fv, cell) in enumerate(
zip(fn.__code__.co_freevars, closure)
):
_bound_value = self._roll_down_to_literal(cell.cell_contents)
if coercions._deep_is_literal(_bound_value):
build_py_wrappers.append((fv, closure_index))
if track_bound_values:
bindparam_trackers.append(
self._bound_parameter_getter_func_closure(
fv, closure_index
)
)
else:
# for normal cell contents, add them to a list that
# we can compare later when we get new lambdas. if
# any identities have changed, then we will
# recalculate the whole lambda and run it again.
if track_closure_variables:
closure_trackers.append(
self._cache_key_getter_closure_variable(
fn, fv, closure_index, cell.cell_contents
)
)
def _setup_additional_closure_trackers(self, fn, lambda_element, opts):
# an additional step is to actually run the function, then
# go through the PyWrapper objects that were set up to catch a bound
# parameter. then if they *didn't* make a param, oh they're another
# object in the closure we have to track for our cache key. so
# create trackers to catch those.
analyzed_function = AnalyzedFunction(
self,
lambda_element,
None,
fn,
)
closure_trackers = self.closure_trackers
for pywrapper in analyzed_function.closure_pywrappers:
if not pywrapper._sa__has_param:
closure_trackers.append(
self._cache_key_getter_tracked_literal(fn, pywrapper)
)
@classmethod
def _roll_down_to_literal(cls, element):
is_clause_element = hasattr(element, "__clause_element__")
if is_clause_element:
while not isinstance(
element, (elements.ClauseElement, schema.SchemaItem, type)
):
try:
element = element.__clause_element__()
except AttributeError:
break
if not is_clause_element:
insp = inspection.inspect(element, raiseerr=False)
if insp is not None:
try:
return insp.__clause_element__()
except AttributeError:
return insp
# TODO: should we coerce consts None/True/False here?
return element
else:
return element
def _bound_parameter_getter_func_globals(self, name):
"""Return a getter that will extend a list of bound parameters
with new entries from the ``__globals__`` collection of a particular
lambda.
"""
def extract_parameter_value(
current_fn, tracker_instrumented_fn, result
):
wrapper = tracker_instrumented_fn.__globals__[name]
object.__getattribute__(wrapper, "_extract_bound_parameters")(
current_fn.__globals__[name], result
)
return extract_parameter_value
def _bound_parameter_getter_func_closure(self, name, closure_index):
"""Return a getter that will extend a list of bound parameters
with new entries from the ``__closure__`` collection of a particular
lambda.
"""
def extract_parameter_value(
current_fn, tracker_instrumented_fn, result
):
wrapper = tracker_instrumented_fn.__closure__[
closure_index
].cell_contents
object.__getattribute__(wrapper, "_extract_bound_parameters")(
current_fn.__closure__[closure_index].cell_contents, result
)
return extract_parameter_value
def _cache_key_getter_track_on(self, idx, elem):
"""Return a getter that will extend a cache key with new entries
from the "track_on" parameter passed to a :class:`.LambdaElement`.
"""
if isinstance(elem, tuple):
# tuple must contain hascachekey elements
def get(closure, opts, anon_map, bindparams):
return tuple(
tup_elem._gen_cache_key(anon_map, bindparams)
for tup_elem in opts.track_on[idx]
)
elif isinstance(elem, traversals.HasCacheKey):
def get(closure, opts, anon_map, bindparams):
return opts.track_on[idx]._gen_cache_key(anon_map, bindparams)
else:
def get(closure, opts, anon_map, bindparams):
return opts.track_on[idx]
return get
def _cache_key_getter_closure_variable(
self,
fn,
variable_name,
idx,
cell_contents,
use_clause_element=False,
use_inspect=False,
):
"""Return a getter that will extend a cache key with new entries
from the ``__closure__`` collection of a particular lambda.
"""
if isinstance(cell_contents, traversals.HasCacheKey):
def get(closure, opts, anon_map, bindparams):
obj = closure[idx].cell_contents
if use_inspect:
obj = inspection.inspect(obj)
elif use_clause_element:
while hasattr(obj, "__clause_element__"):
if not getattr(obj, "is_clause_element", False):
obj = obj.__clause_element__()
return obj._gen_cache_key(anon_map, bindparams)
elif isinstance(cell_contents, types.FunctionType):
def get(closure, opts, anon_map, bindparams):
return closure[idx].cell_contents.__code__
elif isinstance(cell_contents, collections_abc.Sequence):
def get(closure, opts, anon_map, bindparams):
contents = closure[idx].cell_contents
try:
return tuple(
elem._gen_cache_key(anon_map, bindparams)
for elem in contents
)
except AttributeError as ae:
self._raise_for_uncacheable_closure_variable(
variable_name, fn, from_=ae
)
else:
# if the object is a mapped class or aliased class, or some
# other object in the ORM realm of things like that, imitate
# the logic used in coercions.expect() to roll it down to the
# SQL element
element = cell_contents
is_clause_element = False
while hasattr(element, "__clause_element__"):
is_clause_element = True
if not getattr(element, "is_clause_element", False):
element = element.__clause_element__()
else:
break
if not is_clause_element:
insp = inspection.inspect(element, raiseerr=False)
if insp is not None:
return self._cache_key_getter_closure_variable(
fn, variable_name, idx, insp, use_inspect=True
)
else:
return self._cache_key_getter_closure_variable(
fn, variable_name, idx, element, use_clause_element=True
)
self._raise_for_uncacheable_closure_variable(variable_name, fn)
return get
def _raise_for_uncacheable_closure_variable(
self, variable_name, fn, from_=None
):
util.raise_(
exc.InvalidRequestError(
"Closure variable named '%s' inside of lambda callable %s "
"does not refer to a cacheable SQL element, and also does not "
"appear to be serving as a SQL literal bound value based on "
"the default "
"SQL expression returned by the function. This variable "
"needs to remain outside the scope of a SQL-generating lambda "
"so that a proper cache key may be generated from the "
"lambda's state. Evaluate this variable outside of the "
"lambda, set track_on=[<elements>] to explicitly select "
"closure elements to track, or set "
"track_closure_variables=False to exclude "
"closure variables from being part of the cache key."
% (variable_name, fn.__code__),
),
from_=from_,
)
def _cache_key_getter_tracked_literal(self, fn, pytracker):
"""Return a getter that will extend a cache key with new entries
from the ``__closure__`` collection of a particular lambda.
this getter differs from _cache_key_getter_closure_variable
in that these are detected after the function is run, and PyWrapper
objects have recorded that a particular literal value is in fact
not being interpreted as a bound parameter.
"""
elem = pytracker._sa__to_evaluate
closure_index = pytracker._sa__closure_index
variable_name = pytracker._sa__name
return self._cache_key_getter_closure_variable(
fn, variable_name, closure_index, elem
)
class NonAnalyzedFunction(object):
__slots__ = ("expr",)
closure_bindparams = None
bindparam_trackers = None
def __init__(self, expr):
self.expr = expr
@property
def expected_expr(self):
return self.expr
class AnalyzedFunction(object):
__slots__ = (
"analyzed_code",
"fn",
"closure_pywrappers",
"tracker_instrumented_fn",
"expr",
"bindparam_trackers",
"expected_expr",
"is_sequence",
"propagate_attrs",
"closure_bindparams",
)
def __init__(
self,
analyzed_code,
lambda_element,
apply_propagate_attrs,
fn,
):
self.analyzed_code = analyzed_code
self.fn = fn
self.bindparam_trackers = analyzed_code.bindparam_trackers
self._instrument_and_run_function(lambda_element)
self._coerce_expression(lambda_element, apply_propagate_attrs)
def _instrument_and_run_function(self, lambda_element):
analyzed_code = self.analyzed_code
fn = self.fn
self.closure_pywrappers = closure_pywrappers = []
build_py_wrappers = analyzed_code.build_py_wrappers
if not build_py_wrappers:
self.tracker_instrumented_fn = tracker_instrumented_fn = fn
self.expr = lambda_element._invoke_user_fn(tracker_instrumented_fn)
else:
track_closure_variables = analyzed_code.track_closure_variables
closure = fn.__closure__
# will form the __closure__ of the function when we rebuild it
if closure:
new_closure = {
fv: cell.cell_contents
for fv, cell in zip(fn.__code__.co_freevars, closure)
}
else:
new_closure = {}
# will form the __globals__ of the function when we rebuild it
new_globals = fn.__globals__.copy()
for name, closure_index in build_py_wrappers:
if closure_index is not None:
value = closure[closure_index].cell_contents
new_closure[name] = bind = PyWrapper(
fn,
name,
value,
closure_index=closure_index,
track_bound_values=(
self.analyzed_code.track_bound_values
),
)
if track_closure_variables:
closure_pywrappers.append(bind)
else:
value = fn.__globals__[name]
new_globals[name] = bind = PyWrapper(fn, name, value)
# rewrite the original fn. things that look like they will
# become bound parameters are wrapped in a PyWrapper.
self.tracker_instrumented_fn = (
tracker_instrumented_fn
) = self._rewrite_code_obj(
fn,
[new_closure[name] for name in fn.__code__.co_freevars],
new_globals,
)
# now invoke the function. This will give us a new SQL
# expression, but all the places that there would be a bound
# parameter, the PyWrapper in its place will give us a bind
# with a predictable name we can match up later.
# additionally, each PyWrapper will log that it did in fact
# create a parameter, otherwise, it's some kind of Python
# object in the closure and we want to track that, to make
# sure it doesn't change to something else, or if it does,
# that we create a different tracked function with that
# variable.
self.expr = lambda_element._invoke_user_fn(tracker_instrumented_fn)
def _coerce_expression(self, lambda_element, apply_propagate_attrs):
"""Run the tracker-generated expression through coercion rules.
After the user-defined lambda has been invoked to produce a statement
for re-use, run it through coercion rules to both check that it's the
correct type of object and also to coerce it to its useful form.
"""
parent_lambda = lambda_element.parent_lambda
expr = self.expr
if parent_lambda is None:
if isinstance(expr, collections_abc.Sequence):
self.expected_expr = [
coercions.expect(
lambda_element.role,
sub_expr,
apply_propagate_attrs=apply_propagate_attrs,
)
for sub_expr in expr
]
self.is_sequence = True
else:
self.expected_expr = coercions.expect(
lambda_element.role,
expr,
apply_propagate_attrs=apply_propagate_attrs,
)
self.is_sequence = False
else:
self.expected_expr = expr
self.is_sequence = False
if apply_propagate_attrs is not None:
self.propagate_attrs = apply_propagate_attrs._propagate_attrs
else:
self.propagate_attrs = util.EMPTY_DICT
def _rewrite_code_obj(self, f, cell_values, globals_):
"""Return a copy of f, with a new closure and new globals
yes it works in pypy :P
"""
argrange = range(len(cell_values))
code = "def make_cells():\n"
if cell_values:
code += " (%s) = (%s)\n" % (
", ".join("i%d" % i for i in argrange),
", ".join("o%d" % i for i in argrange),
)
code += " def closure():\n"
code += " return %s\n" % ", ".join("i%d" % i for i in argrange)
code += " return closure.__closure__"
vars_ = {"o%d" % i: cell_values[i] for i in argrange}
compat.exec_(code, vars_, vars_)
closure = vars_["make_cells"]()
func = type(f)(
f.__code__, globals_, f.__name__, f.__defaults__, closure
)
if sys.version_info >= (3,):
func.__annotations__ = f.__annotations__
func.__kwdefaults__ = f.__kwdefaults__
func.__doc__ = f.__doc__
func.__module__ = f.__module__
return func
class PyWrapper(ColumnOperators):
"""A wrapper object that is injected into the ``__globals__`` and
``__closure__`` of a Python function.
When the function is instrumented with :class:`.PyWrapper` objects, it is
then invoked just once in order to set up the wrappers. We look through
all the :class:`.PyWrapper` objects we made to find the ones that generated
a :class:`.BindParameter` object, e.g. the expression system interpreted
something as a literal. Those positions in the globals/closure are then
ones that we will look at, each time a new lambda comes in that refers to
the same ``__code__`` object. In this way, we keep a single version of
the SQL expression that this lambda produced, without calling upon the
Python function that created it more than once, unless its other closure
variables have changed. The expression is then transformed to have the
new bound values embedded into it.
"""
def __init__(
self,
fn,
name,
to_evaluate,
closure_index=None,
getter=None,
track_bound_values=True,
):
self.fn = fn
self._name = name
self._to_evaluate = to_evaluate
self._param = None
self._has_param = False
self._bind_paths = {}
self._getter = getter
self._closure_index = closure_index
self.track_bound_values = track_bound_values
def __call__(self, *arg, **kw):
elem = object.__getattribute__(self, "_to_evaluate")
value = elem(*arg, **kw)
if (
self._sa_track_bound_values
and coercions._deep_is_literal(value)
and not isinstance(
# TODO: coverage where an ORM option or similar is here
value,
traversals.HasCacheKey,
)
):
name = object.__getattribute__(self, "_name")
raise exc.InvalidRequestError(
"Can't invoke Python callable %s() inside of lambda "
"expression argument at %s; lambda SQL constructs should "
"not invoke functions from closure variables to produce "
"literal values since the "
"lambda SQL system normally extracts bound values without "
"actually "
"invoking the lambda or any functions within it. Call the "
"function outside of the "
"lambda and assign to a local variable that is used in the "
"lambda as a closure variable, or set "
"track_bound_values=False if the return value of this "
"function is used in some other way other than a SQL bound "
"value." % (name, self._sa_fn.__code__)
)
else:
return value
def operate(self, op, *other, **kwargs):
elem = object.__getattribute__(self, "__clause_element__")()
return op(elem, *other, **kwargs)
def reverse_operate(self, op, other, **kwargs):
elem = object.__getattribute__(self, "__clause_element__")()
return op(other, elem, **kwargs)
def _extract_bound_parameters(self, starting_point, result_list):
param = object.__getattribute__(self, "_param")
if param is not None:
param = param._with_value(starting_point, maintain_key=True)
result_list.append(param)
for pywrapper in object.__getattribute__(self, "_bind_paths").values():
getter = object.__getattribute__(pywrapper, "_getter")
element = getter(starting_point)
pywrapper._sa__extract_bound_parameters(element, result_list)
def __clause_element__(self):
param = object.__getattribute__(self, "_param")
to_evaluate = object.__getattribute__(self, "_to_evaluate")
if param is None:
name = object.__getattribute__(self, "_name")
self._param = param = elements.BindParameter(
name, required=False, unique=True
)
self._has_param = True
param.type = type_api._resolve_value_to_type(to_evaluate)
return param._with_value(to_evaluate, maintain_key=True)
def __bool__(self):
to_evaluate = object.__getattribute__(self, "_to_evaluate")
return bool(to_evaluate)
def __nonzero__(self):
to_evaluate = object.__getattribute__(self, "_to_evaluate")
return bool(to_evaluate)
def __getattribute__(self, key):
if key.startswith("_sa_"):
return object.__getattribute__(self, key[4:])
elif key in (
"__clause_element__",
"operate",
"reverse_operate",
"__class__",
"__dict__",
):
return object.__getattribute__(self, key)
if key.startswith("__"):
elem = object.__getattribute__(self, "_to_evaluate")
return getattr(elem, key)
else:
return self._sa__add_getter(key, operator.attrgetter)
def __iter__(self):
elem = object.__getattribute__(self, "_to_evaluate")
return iter(elem)
def __getitem__(self, key):
elem = object.__getattribute__(self, "_to_evaluate")
if not hasattr(elem, "__getitem__"):
raise AttributeError("__getitem__")
if isinstance(key, PyWrapper):
# TODO: coverage
raise exc.InvalidRequestError(
"Dictionary keys / list indexes inside of a cached "
"lambda must be Python literals only"
)
return self._sa__add_getter(key, operator.itemgetter)
def _add_getter(self, key, getter_fn):
bind_paths = object.__getattribute__(self, "_bind_paths")
bind_path_key = (key, getter_fn)
if bind_path_key in bind_paths:
return bind_paths[bind_path_key]
getter = getter_fn(key)
elem = object.__getattribute__(self, "_to_evaluate")
value = getter(elem)
rolled_down_value = AnalyzedCode._roll_down_to_literal(value)
if coercions._deep_is_literal(rolled_down_value):
wrapper = PyWrapper(self._sa_fn, key, value, getter=getter)
bind_paths[bind_path_key] = wrapper
return wrapper
else:
return value
@inspection._inspects(LambdaElement)
def insp(lmb):
return inspection.inspect(lmb._resolved)