serializer.py 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395
  1. import builtins
  2. import collections.abc
  3. import datetime
  4. import decimal
  5. import enum
  6. import functools
  7. import math
  8. import os
  9. import pathlib
  10. import re
  11. import types
  12. import uuid
  13. from django.conf import SettingsReference
  14. from django.db import models
  15. from django.db.migrations.operations.base import Operation
  16. from django.db.migrations.utils import COMPILED_REGEX_TYPE, RegexObject
  17. from django.utils.functional import LazyObject, Promise
  18. from django.utils.version import PY311, get_docs_version
  19. class BaseSerializer:
  20. def __init__(self, value):
  21. self.value = value
  22. def serialize(self):
  23. raise NotImplementedError(
  24. "Subclasses of BaseSerializer must implement the serialize() method."
  25. )
  26. class BaseSequenceSerializer(BaseSerializer):
  27. def _format(self):
  28. raise NotImplementedError(
  29. "Subclasses of BaseSequenceSerializer must implement the _format() method."
  30. )
  31. def serialize(self):
  32. imports = set()
  33. strings = []
  34. for item in self.value:
  35. item_string, item_imports = serializer_factory(item).serialize()
  36. imports.update(item_imports)
  37. strings.append(item_string)
  38. value = self._format()
  39. return value % (", ".join(strings)), imports
  40. class BaseSimpleSerializer(BaseSerializer):
  41. def serialize(self):
  42. return repr(self.value), set()
  43. class ChoicesSerializer(BaseSerializer):
  44. def serialize(self):
  45. return serializer_factory(self.value.value).serialize()
  46. class DateTimeSerializer(BaseSerializer):
  47. """For datetime.*, except datetime.datetime."""
  48. def serialize(self):
  49. return repr(self.value), {"import datetime"}
  50. class DatetimeDatetimeSerializer(BaseSerializer):
  51. """For datetime.datetime."""
  52. def serialize(self):
  53. if self.value.tzinfo is not None and self.value.tzinfo != datetime.timezone.utc:
  54. self.value = self.value.astimezone(datetime.timezone.utc)
  55. imports = ["import datetime"]
  56. return repr(self.value), set(imports)
  57. class DecimalSerializer(BaseSerializer):
  58. def serialize(self):
  59. return repr(self.value), {"from decimal import Decimal"}
  60. class DeconstructableSerializer(BaseSerializer):
  61. @staticmethod
  62. def serialize_deconstructed(path, args, kwargs):
  63. name, imports = DeconstructableSerializer._serialize_path(path)
  64. strings = []
  65. for arg in args:
  66. arg_string, arg_imports = serializer_factory(arg).serialize()
  67. strings.append(arg_string)
  68. imports.update(arg_imports)
  69. for kw, arg in sorted(kwargs.items()):
  70. arg_string, arg_imports = serializer_factory(arg).serialize()
  71. imports.update(arg_imports)
  72. strings.append("%s=%s" % (kw, arg_string))
  73. return "%s(%s)" % (name, ", ".join(strings)), imports
  74. @staticmethod
  75. def _serialize_path(path):
  76. module, name = path.rsplit(".", 1)
  77. if module == "django.db.models":
  78. imports = {"from django.db import models"}
  79. name = "models.%s" % name
  80. else:
  81. imports = {"import %s" % module}
  82. name = path
  83. return name, imports
  84. def serialize(self):
  85. return self.serialize_deconstructed(*self.value.deconstruct())
  86. class DictionarySerializer(BaseSerializer):
  87. def serialize(self):
  88. imports = set()
  89. strings = []
  90. for k, v in sorted(self.value.items()):
  91. k_string, k_imports = serializer_factory(k).serialize()
  92. v_string, v_imports = serializer_factory(v).serialize()
  93. imports.update(k_imports)
  94. imports.update(v_imports)
  95. strings.append((k_string, v_string))
  96. return "{%s}" % (", ".join("%s: %s" % (k, v) for k, v in strings)), imports
  97. class EnumSerializer(BaseSerializer):
  98. def serialize(self):
  99. enum_class = self.value.__class__
  100. module = enum_class.__module__
  101. if issubclass(enum_class, enum.Flag):
  102. if PY311:
  103. members = list(self.value)
  104. else:
  105. members, _ = enum._decompose(enum_class, self.value)
  106. members = reversed(members)
  107. else:
  108. members = (self.value,)
  109. return (
  110. " | ".join(
  111. [
  112. f"{module}.{enum_class.__qualname__}[{item.name!r}]"
  113. for item in members
  114. ]
  115. ),
  116. {"import %s" % module},
  117. )
  118. class FloatSerializer(BaseSimpleSerializer):
  119. def serialize(self):
  120. if math.isnan(self.value) or math.isinf(self.value):
  121. return 'float("{}")'.format(self.value), set()
  122. return super().serialize()
  123. class FrozensetSerializer(BaseSequenceSerializer):
  124. def _format(self):
  125. return "frozenset([%s])"
  126. class FunctionTypeSerializer(BaseSerializer):
  127. def serialize(self):
  128. if getattr(self.value, "__self__", None) and isinstance(
  129. self.value.__self__, type
  130. ):
  131. klass = self.value.__self__
  132. module = klass.__module__
  133. return "%s.%s.%s" % (module, klass.__name__, self.value.__name__), {
  134. "import %s" % module
  135. }
  136. # Further error checking
  137. if self.value.__name__ == "<lambda>":
  138. raise ValueError("Cannot serialize function: lambda")
  139. if self.value.__module__ is None:
  140. raise ValueError("Cannot serialize function %r: No module" % self.value)
  141. module_name = self.value.__module__
  142. if "<" not in self.value.__qualname__: # Qualname can include <locals>
  143. return "%s.%s" % (module_name, self.value.__qualname__), {
  144. "import %s" % self.value.__module__
  145. }
  146. raise ValueError(
  147. "Could not find function %s in %s.\n" % (self.value.__name__, module_name)
  148. )
  149. class FunctoolsPartialSerializer(BaseSerializer):
  150. def serialize(self):
  151. # Serialize functools.partial() arguments
  152. func_string, func_imports = serializer_factory(self.value.func).serialize()
  153. args_string, args_imports = serializer_factory(self.value.args).serialize()
  154. keywords_string, keywords_imports = serializer_factory(
  155. self.value.keywords
  156. ).serialize()
  157. # Add any imports needed by arguments
  158. imports = {"import functools", *func_imports, *args_imports, *keywords_imports}
  159. return (
  160. "functools.%s(%s, *%s, **%s)"
  161. % (
  162. self.value.__class__.__name__,
  163. func_string,
  164. args_string,
  165. keywords_string,
  166. ),
  167. imports,
  168. )
  169. class IterableSerializer(BaseSerializer):
  170. def serialize(self):
  171. imports = set()
  172. strings = []
  173. for item in self.value:
  174. item_string, item_imports = serializer_factory(item).serialize()
  175. imports.update(item_imports)
  176. strings.append(item_string)
  177. # When len(strings)==0, the empty iterable should be serialized as
  178. # "()", not "(,)" because (,) is invalid Python syntax.
  179. value = "(%s)" if len(strings) != 1 else "(%s,)"
  180. return value % (", ".join(strings)), imports
  181. class ModelFieldSerializer(DeconstructableSerializer):
  182. def serialize(self):
  183. attr_name, path, args, kwargs = self.value.deconstruct()
  184. return self.serialize_deconstructed(path, args, kwargs)
  185. class ModelManagerSerializer(DeconstructableSerializer):
  186. def serialize(self):
  187. as_manager, manager_path, qs_path, args, kwargs = self.value.deconstruct()
  188. if as_manager:
  189. name, imports = self._serialize_path(qs_path)
  190. return "%s.as_manager()" % name, imports
  191. else:
  192. return self.serialize_deconstructed(manager_path, args, kwargs)
  193. class OperationSerializer(BaseSerializer):
  194. def serialize(self):
  195. from django.db.migrations.writer import OperationWriter
  196. string, imports = OperationWriter(self.value, indentation=0).serialize()
  197. # Nested operation, trailing comma is handled in upper OperationWriter._write()
  198. return string.rstrip(","), imports
  199. class PathLikeSerializer(BaseSerializer):
  200. def serialize(self):
  201. return repr(os.fspath(self.value)), {}
  202. class PathSerializer(BaseSerializer):
  203. def serialize(self):
  204. # Convert concrete paths to pure paths to avoid issues with migrations
  205. # generated on one platform being used on a different platform.
  206. prefix = "Pure" if isinstance(self.value, pathlib.Path) else ""
  207. return "pathlib.%s%r" % (prefix, self.value), {"import pathlib"}
  208. class RegexSerializer(BaseSerializer):
  209. def serialize(self):
  210. regex_pattern, pattern_imports = serializer_factory(
  211. self.value.pattern
  212. ).serialize()
  213. # Turn off default implicit flags (e.g. re.U) because regexes with the
  214. # same implicit and explicit flags aren't equal.
  215. flags = self.value.flags ^ re.compile("").flags
  216. regex_flags, flag_imports = serializer_factory(flags).serialize()
  217. imports = {"import re", *pattern_imports, *flag_imports}
  218. args = [regex_pattern]
  219. if flags:
  220. args.append(regex_flags)
  221. return "re.compile(%s)" % ", ".join(args), imports
  222. class SequenceSerializer(BaseSequenceSerializer):
  223. def _format(self):
  224. return "[%s]"
  225. class SetSerializer(BaseSequenceSerializer):
  226. def _format(self):
  227. # Serialize as a set literal except when value is empty because {}
  228. # is an empty dict.
  229. return "{%s}" if self.value else "set(%s)"
  230. class SettingsReferenceSerializer(BaseSerializer):
  231. def serialize(self):
  232. return "settings.%s" % self.value.setting_name, {
  233. "from django.conf import settings"
  234. }
  235. class TupleSerializer(BaseSequenceSerializer):
  236. def _format(self):
  237. # When len(value)==0, the empty tuple should be serialized as "()",
  238. # not "(,)" because (,) is invalid Python syntax.
  239. return "(%s)" if len(self.value) != 1 else "(%s,)"
  240. class TypeSerializer(BaseSerializer):
  241. def serialize(self):
  242. special_cases = [
  243. (models.Model, "models.Model", ["from django.db import models"]),
  244. (type(None), "type(None)", []),
  245. ]
  246. for case, string, imports in special_cases:
  247. if case is self.value:
  248. return string, set(imports)
  249. if hasattr(self.value, "__module__"):
  250. module = self.value.__module__
  251. if module == builtins.__name__:
  252. return self.value.__name__, set()
  253. else:
  254. return "%s.%s" % (module, self.value.__qualname__), {
  255. "import %s" % module
  256. }
  257. class UUIDSerializer(BaseSerializer):
  258. def serialize(self):
  259. return "uuid.%s" % repr(self.value), {"import uuid"}
  260. class Serializer:
  261. _registry = {
  262. # Some of these are order-dependent.
  263. frozenset: FrozensetSerializer,
  264. list: SequenceSerializer,
  265. set: SetSerializer,
  266. tuple: TupleSerializer,
  267. dict: DictionarySerializer,
  268. models.Choices: ChoicesSerializer,
  269. enum.Enum: EnumSerializer,
  270. datetime.datetime: DatetimeDatetimeSerializer,
  271. (datetime.date, datetime.timedelta, datetime.time): DateTimeSerializer,
  272. SettingsReference: SettingsReferenceSerializer,
  273. float: FloatSerializer,
  274. (bool, int, type(None), bytes, str, range): BaseSimpleSerializer,
  275. decimal.Decimal: DecimalSerializer,
  276. (functools.partial, functools.partialmethod): FunctoolsPartialSerializer,
  277. (
  278. types.FunctionType,
  279. types.BuiltinFunctionType,
  280. types.MethodType,
  281. ): FunctionTypeSerializer,
  282. collections.abc.Iterable: IterableSerializer,
  283. (COMPILED_REGEX_TYPE, RegexObject): RegexSerializer,
  284. uuid.UUID: UUIDSerializer,
  285. pathlib.PurePath: PathSerializer,
  286. os.PathLike: PathLikeSerializer,
  287. }
  288. @classmethod
  289. def register(cls, type_, serializer):
  290. if not issubclass(serializer, BaseSerializer):
  291. raise ValueError(
  292. "'%s' must inherit from 'BaseSerializer'." % serializer.__name__
  293. )
  294. cls._registry[type_] = serializer
  295. @classmethod
  296. def unregister(cls, type_):
  297. cls._registry.pop(type_)
  298. def serializer_factory(value):
  299. if isinstance(value, Promise):
  300. value = str(value)
  301. elif isinstance(value, LazyObject):
  302. # The unwrapped value is returned as the first item of the arguments
  303. # tuple.
  304. value = value.__reduce__()[1][0]
  305. if isinstance(value, models.Field):
  306. return ModelFieldSerializer(value)
  307. if isinstance(value, models.manager.BaseManager):
  308. return ModelManagerSerializer(value)
  309. if isinstance(value, Operation):
  310. return OperationSerializer(value)
  311. if isinstance(value, type):
  312. return TypeSerializer(value)
  313. # Anything that knows how to deconstruct itself.
  314. if hasattr(value, "deconstruct"):
  315. return DeconstructableSerializer(value)
  316. for type_, serializer_cls in Serializer._registry.items():
  317. if isinstance(value, type_):
  318. return serializer_cls(value)
  319. raise ValueError(
  320. "Cannot serialize: %r\nThere are some values Django cannot serialize into "
  321. "migration files.\nFor more, see https://docs.djangoproject.com/en/%s/"
  322. "topics/migrations/#migration-serializing" % (value, get_docs_version())
  323. )