Source code for pgtrigger.core

import contextlib
import copy
import hashlib
import inspect
import re

from django.db import DEFAULT_DB_ALIAS, models, router, transaction
from django.db.models.expressions import Col
from django.db.models.fields.related import RelatedField
from django.db.models.sql import Query
from django.db.models.sql.datastructures import BaseTable
from django.db.utils import ProgrammingError
import psycopg2.extensions

from pgtrigger import features
from pgtrigger import registry
from pgtrigger import utils


# Postgres only allows identifiers to be 63 chars max. Since "pgtrigger_"
# is the prefix for trigger names, and since an additional "_" and
# 5 character hash is added, the user-defined name of the trigger can only
# be 47 chars.
# NOTE: We can do something more sophisticated later by allowing users
# to name their triggers and then hashing the names when actually creating
# the triggers.
MAX_NAME_LENGTH = 47

# Installation states for a triggers
INSTALLED = "INSTALLED"
UNINSTALLED = "UNINSTALLED"
OUTDATED = "OUTDATED"
PRUNE = "PRUNE"
UNALLOWED = "UNALLOWED"


class _Serializable:
    def get_init_vals(self):
        """Returns class initialization args so that they are properly serialized for migrations"""
        parameters = inspect.signature(self.__init__).parameters

        for key, val in parameters.items():
            if key != "self" and (
                not hasattr(self, key) or val.kind == inspect.Parameter.VAR_KEYWORD
            ):  # pragma: no cover
                raise ValueError(
                    f"Could not automatically serialize Trigger {self.__class__} for migrations."
                    ' Implement "get_init_vals()" on the trigger class. See the'
                    " FAQ in the django-pgtrigger docs for more information."
                )

        args = tuple(
            item
            for key, val in parameters.items()
            if val.kind == inspect.Parameter.VAR_POSITIONAL
            for item in getattr(self, key)
        )

        kwargs = {
            key: getattr(self, key)
            for key, value in parameters.items()
            if key != "self" and val.kind != inspect.Parameter.VAR_POSITIONAL
        }

        return args, kwargs

    def deconstruct(self):
        """For supporting Django migrations"""
        path = f"{self.__class__.__module__}.{self.__class__.__name__}"
        path = path.replace("pgtrigger.core", "pgtrigger")
        path = path.replace("pgtrigger.contrib", "pgtrigger")
        args, kwargs = self.get_init_vals()
        return path, args, kwargs

    def __eq__(self, other):
        return self.__class__ == other.__class__ and self.get_init_vals() == other.get_init_vals()


class _Primitive(_Serializable):
    """Boilerplate for some of the primitive operations"""

    def __init__(self, name):
        assert name in self.values
        self.name = name

    def __str__(self):
        return self.name


class Level(_Primitive):
    values = ("ROW", "STATEMENT")


#: For specifying row-level triggers (the default)
Row = Level("ROW")

#: For specifying statement-level triggers
Statement = Level("STATEMENT")


[docs]class Referencing(_Serializable): """For specifying the REFERENCING clause of a statement-level trigger""" def __init__(self, *, old=None, new=None): if not old and not new: raise ValueError( 'Must provide either "old" and/or "new" to the referencing' " construct of a trigger" ) self.old = old self.new = new def __str__(self): ref = "REFERENCING" if self.old: ref += f" OLD TABLE AS {self.old} " if self.new: ref += f" NEW TABLE AS {self.new} " return ref
class When(_Primitive): values = ("BEFORE", "AFTER", "INSTEAD OF") #: For specifying ``BEFORE`` in the when clause of a trigger. Before = When("BEFORE") #: For specifying ``AFTER`` in the when clause of a trigger. After = When("AFTER") #: For specifying ``INSTEAD OF`` in the when clause of a trigger. InsteadOf = When("INSTEAD OF") class Operation(_Primitive): values = ("UPDATE", "DELETE", "TRUNCATE", "INSERT") def __or__(self, other): assert isinstance(other, Operation) return Operations(self, other) class Operations(Operation): """For providing multiple operations ``OR``ed together. Note that using the ``|`` operator is preferred syntax. """ def __init__(self, *operations): for operation in operations: assert isinstance(operation, Operation) self.operations = operations def __str__(self): return " OR ".join(str(operation) for operation in self.operations) #: For specifying ``UPDATE`` as the trigger operation. Update = Operation("UPDATE") #: For specifying ``DELETE`` as the trigger operation. Delete = Operation("DELETE") #: For specifying ``TRUNCATE`` as the trigger operation. Truncate = Operation("TRUNCATE") #: For specifying ``INSERT`` as the trigger operation. Insert = Operation("INSERT")
[docs]class UpdateOf(Operation): """For specifying ``UPDATE OF`` as the trigger operation.""" def __init__(self, *columns): if not columns: raise ValueError("Must provide at least one column") self.columns = columns def __str__(self): columns = ", ".join(f"{utils.quote(col)}" for col in self.columns) return f"UPDATE OF {columns}"
class Timing(_Primitive): values = ("IMMEDIATE", "DEFERRED") #: For deferrable triggers that run immediately by default Immediate = Timing("IMMEDIATE") #: For deferrable triggers that run at the end of the transaction by default Deferred = Timing("DEFERRED")
[docs]class Condition(_Serializable): """For specifying free-form SQL in the condition of a trigger.""" sql = None def __init__(self, sql=None): self.sql = sql or self.sql if not self.sql: raise ValueError("Must provide SQL to condition") def resolve(self, model): return self.sql
class _OldNewQuery(Query): """ A special Query object for referencing the ``OLD`` and ``NEW`` variables in a trigger. Only used by the `pgtrigger.Q` object. """ def build_lookup(self, lookups, lhs, rhs): # Django does not allow custom lookups on foreign keys, even though # DISTINCT FROM is a comnpletely valid lookup. Trick django into # being able to apply this lookup to related fields. if lookups == ["df"] and isinstance(lhs.output_field, RelatedField): lhs = copy.deepcopy(lhs) lhs.output_field = models.IntegerField(null=lhs.output_field.null) return super().build_lookup(lookups, lhs, rhs) def build_filter(self, filter_expr, *args, **kwargs): if isinstance(filter_expr, Q): return super().build_filter(filter_expr, *args, **kwargs) if filter_expr[0].startswith("old__"): alias = "OLD" elif filter_expr[0].startswith("new__"): alias = "NEW" else: # pragma: no cover raise ValueError("Filter expression on trigger.Q object must reference old__ or new__") filter_expr = (filter_expr[0][5:], filter_expr[1]) node, _ = super().build_filter(filter_expr, *args, **kwargs) self.alias_map[alias] = BaseTable(alias, alias) for child in node.children: child.lhs = Col( alias=alias, target=child.lhs.target, output_field=child.lhs.output_field, ) return node, {alias}
[docs]class F(models.F): """ Similar to Django's ``F`` object, allows referencing the old and new rows in a trigger condition. """ def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) if self.name.startswith("old__"): self.row_alias = "OLD" elif self.name.startswith("new__"): self.row_alias = "NEW" else: raise ValueError("F() values must reference old__ or new__") self.col_name = self.name[5:] def deconstruct(self): path, args, kwargs = super().deconstruct() path = path.replace("pgtrigger.core", "pgtrigger") return path, args, kwargs @property def resolved_name(self): return f"{self.row_alias}.{utils.quote(self.col_name)}" def resolve_expression(self, query=None, *args, **kwargs): return Col( alias=self.row_alias, target=query.model._meta.get_field(self.col_name), )
[docs]@models.fields.Field.register_lookup class IsDistinctFrom(models.Lookup): """ A custom ``IS DISTINCT FROM`` field lookup for common trigger conditions. For example, ``pgtrigger.Q(old__field__df=pgtrigger.F("new__field"))``. """ lookup_name = "df" def as_sql(self, compiler, connection): lhs, lhs_params = self.process_lhs(compiler, connection) rhs, rhs_params = self.process_rhs(compiler, connection) params = lhs_params + rhs_params return "%s IS DISTINCT FROM %s" % (lhs, rhs), params
[docs]@models.fields.Field.register_lookup class IsNotDistinctFrom(models.Lookup): """ A custom ``IS NOT DISTINCT FROM`` field lookup for common trigger conditions. For example, ``pgtrigger.Q(old__field__ndf=pgtrigger.F("new__field"))``. """ lookup_name = "ndf" def as_sql(self, compiler, connection): lhs, lhs_params = self.process_lhs(compiler, connection) rhs, rhs_params = self.process_rhs(compiler, connection) params = lhs_params + rhs_params return "%s IS NOT DISTINCT FROM %s" % (lhs, rhs), params
[docs]class Q(models.Q, Condition): """ Similar to Django's ``Q`` object, allows referencing the old and new rows in a trigger condition. """ def deconstruct(self): path, args, kwargs = super().deconstruct() path = path.replace("pgtrigger.core", "pgtrigger") return path, args, kwargs def resolve(self, model): query = _OldNewQuery(model) sql, args = self.resolve_expression(query).as_sql( compiler=query.get_compiler("default"), connection=utils.connection(), ) sql = sql.replace('"OLD"', "OLD").replace('"NEW"', "NEW") args = tuple(psycopg2.extensions.adapt(arg).getquoted().decode() for arg in args) return sql % args
# Allows Trigger methods to be used as context managers, mostly for # testing purposes @contextlib.contextmanager def _cleanup_on_exit(cleanup): yield cleanup() def _ignore_func_name(): ignore_func = "_pgtrigger_should_ignore" if features.schema(): # pragma: no branch ignore_func = f"{utils.quote(features.schema())}.{ignore_func}" return ignore_func def _render_ignore_func(): """ Triggers can be ignored dynamically by help of a special function that's installed. The definition of this function is here. Note: This function is global and shared by all triggers in the current implementation. It isn't uninstalled when triggers are uninstalled. """ return f""" CREATE OR REPLACE FUNCTION {_ignore_func_name()}( trigger_name NAME ) RETURNS BOOLEAN AS $$ DECLARE _pgtrigger_ignore TEXT[]; _result BOOLEAN; BEGIN BEGIN SELECT INTO _pgtrigger_ignore CURRENT_SETTING('pgtrigger.ignore'); EXCEPTION WHEN OTHERS THEN END; IF _pgtrigger_ignore IS NOT NULL THEN SELECT trigger_name = ANY(_pgtrigger_ignore) INTO _result; RETURN _result; ELSE RETURN FALSE; END IF; END; $$ LANGUAGE plpgsql; """
[docs]class Trigger(_Serializable): """ For specifying a free-form PL/pgSQL trigger function or for creating derived trigger classes. """ name = None level = Row when = None operation = None condition = None referencing = None func = None declare = None timing = None def __init__( self, *, name=None, level=None, when=None, operation=None, condition=None, referencing=None, func=None, declare=None, timing=None, ): self.name = name or self.name self.level = level or self.level self.when = when or self.when self.operation = operation or self.operation self.condition = condition or self.condition self.referencing = referencing or self.referencing self.func = func or self.func self.declare = declare or self.declare self.timing = timing or self.timing if not self.level or not isinstance(self.level, Level): raise ValueError(f'Invalid "level" attribute: {self.level}') if not self.when or not isinstance(self.when, When): raise ValueError(f'Invalid "when" attribute: {self.when}') if not self.operation or not isinstance(self.operation, Operation): raise ValueError(f'Invalid "operation" attribute: {self.operation}') if self.timing and not isinstance(self.timing, Timing): raise ValueError(f'Invalid "timing" attribute: {self.timing}') if self.level == Row and self.referencing: raise ValueError('Row-level triggers cannot have a "referencing" attribute') if self.timing and self.level != Row: raise ValueError('Deferrable triggers must have "level" attribute as "pgtrigger.Row"') if self.timing and self.when != After: raise ValueError('Deferrable triggers must have "when" attribute as "pgtrigger.After"') if not self.name: raise ValueError('Trigger must have "name" attribute') self.validate_name() def __str__(self): return self.name def validate_name(self): """Verifies the name is under the maximum length""" if len(self.name) > MAX_NAME_LENGTH: raise ValueError(f'Trigger name "{self.name}" > {MAX_NAME_LENGTH} characters.') if not re.match(r"^[a-zA-Z0-9-_]+$", self.name): raise ValueError( f'Trigger name "{self.name}" has invalid characters.' " Only alphanumeric characters, hyphens, and underscores are allowed." ) def get_pgid(self, model): """The ID of the trigger and function object in postgres All objects are prefixed with "pgtrigger_" in order to be discovered/managed by django-pgtrigger """ model_hash = hashlib.sha1(self.get_uri(model).encode()).hexdigest()[:5] pgid = f"pgtrigger_{self.name}_{model_hash}" if len(pgid) > 63: raise ValueError(f'Trigger identifier "{pgid}" is greater than 63 chars') # NOTE - Postgres always stores names in lowercase. Ensure that all # generated IDs are lowercase so that we can properly do installation # and pruning tasks. return pgid.lower() def get_hash(self, model): """ Computes a hash for the trigger, which is used to uniquely identify its contents. The hash is computed based on the trigger function and declaration. Note: If the trigger definition includes dynamic data, such as the current time, the trigger hash will always change and appear to be out of sync. """ rendered_func = self.render_func(model) rendered_trigger = self.render_trigger(model) return hashlib.sha1(f"{rendered_func} {rendered_trigger}".encode()).hexdigest() def get_condition(self, model): return self.condition def get_declare(self, model): """ Gets the DECLARE part of the trigger function if any variables are used. Returns: List[tuple]: A list of variable name / type tuples that will be shown in the DECLARE. For example [('row_data', 'JSONB')] """ return self.declare or [] def get_func(self, model): """ Returns the trigger function that comes between the BEGIN and END clause """ if not self.func: raise ValueError("Must define func attribute or implement get_func") return self.func def get_uri(self, model): """The URI for the trigger""" return f"{model._meta.app_label}.{model._meta.object_name}:{self.name}" def render_condition(self, model): """Renders the condition SQL in the trigger declaration""" condition = self.get_condition(model) resolved = condition.resolve(model).strip() if condition else "" if resolved: if not resolved.startswith("("): resolved = f"({resolved})" resolved = f"WHEN {resolved}" return resolved def render_declare(self, model): """Renders the DECLARE of the trigger function, if any""" declare = self.get_declare(model) if declare: rendered_declare = "DECLARE \n" + "\n".join( f"{var_name} {var_type};" for var_name, var_type in declare ) else: rendered_declare = "" return rendered_declare def render_ignore(self, model): """ Renders the clause that can dynamically ignore the trigger's execution """ return f""" IF ({_ignore_func_name()}(TG_NAME) IS TRUE) THEN IF (TG_OP = 'DELETE') THEN RETURN OLD; ELSE RETURN NEW; END IF; END IF; """ def render_func(self, model): """Renders the trigger function SQL statement""" return f""" CREATE OR REPLACE FUNCTION {self.get_pgid(model)}() RETURNS TRIGGER AS $$ {self.render_declare(model)} BEGIN {self.render_ignore(model)} {self.get_func(model)} END; $$ LANGUAGE plpgsql; """ def render_trigger(self, model, function=None): """Renders the trigger declaration SQL statement Args: model (``models.Model``): The Django model over which the trigger will run. function (str, default=None): The function that will be called by the trigger. Defaults to the function that's automatically created for the trigger. """ table = model._meta.db_table pgid = self.get_pgid(model) function = function or f"{pgid}()" constraint = "CONSTRAINT" if self.timing else "" timing = f"DEFERRABLE INITIALLY {self.timing}" if self.timing else "" # Note: Postgres 14 has CREATE OR REPLACE syntax that # we might consider using. return f""" DROP TRIGGER IF EXISTS {pgid} on {utils.quote(table)}; CREATE {constraint} TRIGGER {pgid} {self.when} {self.operation} ON {utils.quote(table)} {timing} {self.referencing or ''} FOR EACH {self.level} {self.render_condition(model)} EXECUTE PROCEDURE {function}; """ def render_comment(self, model): """Renders the trigger commment SQL statement pgtrigger comments the hash of the trigger in order for us to determine if the trigger definition has changed """ pgid = self.get_pgid(model) hash = self.get_hash(model) table = model._meta.db_table return f"COMMENT ON TRIGGER {pgid} ON {utils.quote(table)} IS '{hash}'" def render_install(self, model): ignore_func = _render_ignore_func() rendered_func = self.render_func(model) rendered_trigger = self.render_trigger(model) rendered_comment = self.render_comment(model) return f"{ignore_func}; {rendered_func}; {rendered_trigger}; {rendered_comment};" def render_uninstall(self, model): return utils.render_uninstall(model._meta.db_table, self.get_pgid(model)) def allow_migrate(self, model, database=None): """True if the trigger for this model can be migrated. Defaults to using the router's allow_migrate """ model = model._meta.concrete_model return utils.is_postgres(database) and router.allow_migrate( database or DEFAULT_DB_ALIAS, model._meta.app_label, model_name=model._meta.model_name ) def exec_sql(self, sql, model, database=None, fetchall=False): """Conditionally execute SQL if migrations are allowed""" if self.allow_migrate(model, database=database): return utils.exec_sql(sql, database=database, fetchall=fetchall) def get_installation_status(self, model, database=None): """Returns the installation status of a trigger. The return type is (status, enabled), where status is one of: 1. ``INSTALLED``: If the trigger is installed 2. ``UNINSTALLED``: If the trigger is not installed 3. ``OUTDATED``: If the trigger is installed but has been modified 4. ``IGNORED``: If migrations are not allowed "enabled" is True if the trigger is installed and enabled or false if installed and disabled (or uninstalled). """ if not self.allow_migrate(model, database=database): return (UNALLOWED, None) trigger_exists_sql = f""" SELECT oid, obj_description(oid) AS hash, tgenabled AS enabled FROM pg_trigger WHERE tgname='{self.get_pgid(model)}' AND tgrelid='{utils.quote(model._meta.db_table)}'::regclass; """ try: with transaction.atomic(using=database): results = self.exec_sql( trigger_exists_sql, model, database=database, fetchall=True ) except ProgrammingError: # pragma: no cover # When the table doesn't exist yet, possibly because migrations # haven't been executed, a ProgrammingError will happen because # of an invalid regclass cast. Return 'UNINSTALLED' for this # case return (UNINSTALLED, None) if not results: return (UNINSTALLED, None) else: hash = self.get_hash(model) if hash != results[0][1]: return (OUTDATED, results[0][2] == "O") else: return (INSTALLED, results[0][2] == "O") def register(self, *models): """Register model classes with the trigger""" for model in models: registry.set(self.get_uri(model), model=model, trigger=self) return _cleanup_on_exit(lambda: self.unregister(*models)) def unregister(self, *models): """Unregister model classes with the trigger""" for model in models: registry.delete(self.get_uri(model)) return _cleanup_on_exit(lambda: self.register(*models)) def install(self, model, database=None): """Installs the trigger for a model""" install_sql = self.render_install(model) with transaction.atomic(using=database): self.exec_sql(install_sql, model, database=database) return _cleanup_on_exit(lambda: self.uninstall(model, database=database)) def uninstall(self, model, database=None): """Uninstalls the trigger for a model""" uninstall_sql = self.render_uninstall(model) self.exec_sql(uninstall_sql, model, database=database) return _cleanup_on_exit( # pragma: no branch lambda: self.install(model, database=database) ) def enable(self, model, database=None): """Enables the trigger for a model""" enable_sql = ( f"ALTER TABLE {utils.quote(model._meta.db_table)}" f" ENABLE TRIGGER {self.get_pgid(model)};" ) self.exec_sql(enable_sql, model, database=database) return _cleanup_on_exit( # pragma: no branch lambda: self.disable(model, database=database) ) def disable(self, model, database=None): """Disables the trigger for a model""" disable_sql = ( f"ALTER TABLE {utils.quote(model._meta.db_table)}" f" DISABLE TRIGGER {self.get_pgid(model)};" ) self.exec_sql(disable_sql, model, database=database) return _cleanup_on_exit(lambda: self.enable(model, database=database)) # pragma: no branch