indexes.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297
  1. from types import NoneType
  2. from django.db.backends.utils import names_digest, split_identifier
  3. from django.db.models.expressions import Col, ExpressionList, F, Func, OrderBy
  4. from django.db.models.functions import Collate
  5. from django.db.models.query_utils import Q
  6. from django.db.models.sql import Query
  7. from django.utils.functional import partition
  8. __all__ = ["Index"]
  9. class Index:
  10. suffix = "idx"
  11. # The max length of the name of the index (restricted to 30 for
  12. # cross-database compatibility with Oracle)
  13. max_name_length = 30
  14. def __init__(
  15. self,
  16. *expressions,
  17. fields=(),
  18. name=None,
  19. db_tablespace=None,
  20. opclasses=(),
  21. condition=None,
  22. include=None,
  23. ):
  24. if opclasses and not name:
  25. raise ValueError("An index must be named to use opclasses.")
  26. if not isinstance(condition, (NoneType, Q)):
  27. raise ValueError("Index.condition must be a Q instance.")
  28. if condition and not name:
  29. raise ValueError("An index must be named to use condition.")
  30. if not isinstance(fields, (list, tuple)):
  31. raise ValueError("Index.fields must be a list or tuple.")
  32. if not isinstance(opclasses, (list, tuple)):
  33. raise ValueError("Index.opclasses must be a list or tuple.")
  34. if not expressions and not fields:
  35. raise ValueError(
  36. "At least one field or expression is required to define an index."
  37. )
  38. if expressions and fields:
  39. raise ValueError(
  40. "Index.fields and expressions are mutually exclusive.",
  41. )
  42. if expressions and not name:
  43. raise ValueError("An index must be named to use expressions.")
  44. if expressions and opclasses:
  45. raise ValueError(
  46. "Index.opclasses cannot be used with expressions. Use "
  47. "django.contrib.postgres.indexes.OpClass() instead."
  48. )
  49. if opclasses and len(fields) != len(opclasses):
  50. raise ValueError(
  51. "Index.fields and Index.opclasses must have the same number of "
  52. "elements."
  53. )
  54. if fields and not all(isinstance(field, str) for field in fields):
  55. raise ValueError("Index.fields must contain only strings with field names.")
  56. if include and not name:
  57. raise ValueError("A covering index must be named.")
  58. if not isinstance(include, (NoneType, list, tuple)):
  59. raise ValueError("Index.include must be a list or tuple.")
  60. self.fields = list(fields)
  61. # A list of 2-tuple with the field name and ordering ('' or 'DESC').
  62. self.fields_orders = [
  63. (field_name.removeprefix("-"), "DESC" if field_name.startswith("-") else "")
  64. for field_name in self.fields
  65. ]
  66. self.name = name or ""
  67. self.db_tablespace = db_tablespace
  68. self.opclasses = opclasses
  69. self.condition = condition
  70. self.include = tuple(include) if include else ()
  71. self.expressions = tuple(
  72. F(expression) if isinstance(expression, str) else expression
  73. for expression in expressions
  74. )
  75. @property
  76. def contains_expressions(self):
  77. return bool(self.expressions)
  78. def _get_condition_sql(self, model, schema_editor):
  79. if self.condition is None:
  80. return None
  81. query = Query(model=model, alias_cols=False)
  82. where = query.build_where(self.condition)
  83. compiler = query.get_compiler(connection=schema_editor.connection)
  84. sql, params = where.as_sql(compiler, schema_editor.connection)
  85. return sql % tuple(schema_editor.quote_value(p) for p in params)
  86. def create_sql(self, model, schema_editor, using="", **kwargs):
  87. include = [
  88. model._meta.get_field(field_name).column for field_name in self.include
  89. ]
  90. condition = self._get_condition_sql(model, schema_editor)
  91. if self.expressions:
  92. index_expressions = []
  93. for expression in self.expressions:
  94. index_expression = IndexExpression(expression)
  95. index_expression.set_wrapper_classes(schema_editor.connection)
  96. index_expressions.append(index_expression)
  97. expressions = ExpressionList(*index_expressions).resolve_expression(
  98. Query(model, alias_cols=False),
  99. )
  100. fields = None
  101. col_suffixes = None
  102. else:
  103. fields = [
  104. model._meta.get_field(field_name)
  105. for field_name, _ in self.fields_orders
  106. ]
  107. if schema_editor.connection.features.supports_index_column_ordering:
  108. col_suffixes = [order[1] for order in self.fields_orders]
  109. else:
  110. col_suffixes = [""] * len(self.fields_orders)
  111. expressions = None
  112. return schema_editor._create_index_sql(
  113. model,
  114. fields=fields,
  115. name=self.name,
  116. using=using,
  117. db_tablespace=self.db_tablespace,
  118. col_suffixes=col_suffixes,
  119. opclasses=self.opclasses,
  120. condition=condition,
  121. include=include,
  122. expressions=expressions,
  123. **kwargs,
  124. )
  125. def remove_sql(self, model, schema_editor, **kwargs):
  126. return schema_editor._delete_index_sql(model, self.name, **kwargs)
  127. def deconstruct(self):
  128. path = "%s.%s" % (self.__class__.__module__, self.__class__.__name__)
  129. path = path.replace("django.db.models.indexes", "django.db.models")
  130. kwargs = {"name": self.name}
  131. if self.fields:
  132. kwargs["fields"] = self.fields
  133. if self.db_tablespace is not None:
  134. kwargs["db_tablespace"] = self.db_tablespace
  135. if self.opclasses:
  136. kwargs["opclasses"] = self.opclasses
  137. if self.condition:
  138. kwargs["condition"] = self.condition
  139. if self.include:
  140. kwargs["include"] = self.include
  141. return (path, self.expressions, kwargs)
  142. def clone(self):
  143. """Create a copy of this Index."""
  144. _, args, kwargs = self.deconstruct()
  145. return self.__class__(*args, **kwargs)
  146. def set_name_with_model(self, model):
  147. """
  148. Generate a unique name for the index.
  149. The name is divided into 3 parts - table name (12 chars), field name
  150. (8 chars) and unique hash + suffix (10 chars). Each part is made to
  151. fit its size by truncating the excess length.
  152. """
  153. _, table_name = split_identifier(model._meta.db_table)
  154. column_names = [
  155. model._meta.get_field(field_name).column
  156. for field_name, order in self.fields_orders
  157. ]
  158. column_names_with_order = [
  159. (("-%s" if order else "%s") % column_name)
  160. for column_name, (field_name, order) in zip(
  161. column_names, self.fields_orders
  162. )
  163. ]
  164. # The length of the parts of the name is based on the default max
  165. # length of 30 characters.
  166. hash_data = [table_name] + column_names_with_order + [self.suffix]
  167. self.name = "%s_%s_%s" % (
  168. table_name[:11],
  169. column_names[0][:7],
  170. "%s_%s" % (names_digest(*hash_data, length=6), self.suffix),
  171. )
  172. if len(self.name) > self.max_name_length:
  173. raise ValueError(
  174. "Index too long for multiple database support. Is self.suffix "
  175. "longer than 3 characters?"
  176. )
  177. if self.name[0] == "_" or self.name[0].isdigit():
  178. self.name = "D%s" % self.name[1:]
  179. def __repr__(self):
  180. return "<%s:%s%s%s%s%s%s%s>" % (
  181. self.__class__.__qualname__,
  182. "" if not self.fields else " fields=%s" % repr(self.fields),
  183. "" if not self.expressions else " expressions=%s" % repr(self.expressions),
  184. "" if not self.name else " name=%s" % repr(self.name),
  185. ""
  186. if self.db_tablespace is None
  187. else " db_tablespace=%s" % repr(self.db_tablespace),
  188. "" if self.condition is None else " condition=%s" % self.condition,
  189. "" if not self.include else " include=%s" % repr(self.include),
  190. "" if not self.opclasses else " opclasses=%s" % repr(self.opclasses),
  191. )
  192. def __eq__(self, other):
  193. if self.__class__ == other.__class__:
  194. return self.deconstruct() == other.deconstruct()
  195. return NotImplemented
  196. class IndexExpression(Func):
  197. """Order and wrap expressions for CREATE INDEX statements."""
  198. template = "%(expressions)s"
  199. wrapper_classes = (OrderBy, Collate)
  200. def set_wrapper_classes(self, connection=None):
  201. # Some databases (e.g. MySQL) treats COLLATE as an indexed expression.
  202. if connection and connection.features.collate_as_index_expression:
  203. self.wrapper_classes = tuple(
  204. [
  205. wrapper_cls
  206. for wrapper_cls in self.wrapper_classes
  207. if wrapper_cls is not Collate
  208. ]
  209. )
  210. @classmethod
  211. def register_wrappers(cls, *wrapper_classes):
  212. cls.wrapper_classes = wrapper_classes
  213. def resolve_expression(
  214. self,
  215. query=None,
  216. allow_joins=True,
  217. reuse=None,
  218. summarize=False,
  219. for_save=False,
  220. ):
  221. expressions = list(self.flatten())
  222. # Split expressions and wrappers.
  223. index_expressions, wrappers = partition(
  224. lambda e: isinstance(e, self.wrapper_classes),
  225. expressions,
  226. )
  227. wrapper_types = [type(wrapper) for wrapper in wrappers]
  228. if len(wrapper_types) != len(set(wrapper_types)):
  229. raise ValueError(
  230. "Multiple references to %s can't be used in an indexed "
  231. "expression."
  232. % ", ".join(
  233. [wrapper_cls.__qualname__ for wrapper_cls in self.wrapper_classes]
  234. )
  235. )
  236. if expressions[1 : len(wrappers) + 1] != wrappers:
  237. raise ValueError(
  238. "%s must be topmost expressions in an indexed expression."
  239. % ", ".join(
  240. [wrapper_cls.__qualname__ for wrapper_cls in self.wrapper_classes]
  241. )
  242. )
  243. # Wrap expressions in parentheses if they are not column references.
  244. root_expression = index_expressions[1]
  245. resolve_root_expression = root_expression.resolve_expression(
  246. query,
  247. allow_joins,
  248. reuse,
  249. summarize,
  250. for_save,
  251. )
  252. if not isinstance(resolve_root_expression, Col):
  253. root_expression = Func(root_expression, template="(%(expressions)s)")
  254. if wrappers:
  255. # Order wrappers and set their expressions.
  256. wrappers = sorted(
  257. wrappers,
  258. key=lambda w: self.wrapper_classes.index(type(w)),
  259. )
  260. wrappers = [wrapper.copy() for wrapper in wrappers]
  261. for i, wrapper in enumerate(wrappers[:-1]):
  262. wrapper.set_source_expressions([wrappers[i + 1]])
  263. # Set the root expression on the deepest wrapper.
  264. wrappers[-1].set_source_expressions([root_expression])
  265. self.set_source_expressions([wrappers[0]])
  266. else:
  267. # Use the root expression, if there are no wrappers.
  268. self.set_source_expressions([root_expression])
  269. return super().resolve_expression(
  270. query, allow_joins, reuse, summarize, for_save
  271. )
  272. def as_sqlite(self, compiler, connection, **extra_context):
  273. # Casting to numeric is unnecessary.
  274. return self.as_sql(compiler, connection, **extra_context)