serializer.py 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185
  1. # ext/serializer.py
  2. # Copyright (C) 2005-2025 the SQLAlchemy authors and contributors
  3. # <see AUTHORS file>
  4. #
  5. # This module is part of SQLAlchemy and is released under
  6. # the MIT License: https://www.opensource.org/licenses/mit-license.php
  7. # mypy: ignore-errors
  8. """Serializer/Deserializer objects for usage with SQLAlchemy query structures,
  9. allowing "contextual" deserialization.
  10. .. legacy::
  11. The serializer extension is **legacy** and should not be used for
  12. new development.
  13. Any SQLAlchemy query structure, either based on sqlalchemy.sql.*
  14. or sqlalchemy.orm.* can be used. The mappers, Tables, Columns, Session
  15. etc. which are referenced by the structure are not persisted in serialized
  16. form, but are instead re-associated with the query structure
  17. when it is deserialized.
  18. .. warning:: The serializer extension uses pickle to serialize and
  19. deserialize objects, so the same security consideration mentioned
  20. in the `python documentation
  21. <https://docs.python.org/3/library/pickle.html>`_ apply.
  22. Usage is nearly the same as that of the standard Python pickle module::
  23. from sqlalchemy.ext.serializer import loads, dumps
  24. metadata = MetaData(bind=some_engine)
  25. Session = scoped_session(sessionmaker())
  26. # ... define mappers
  27. query = (
  28. Session.query(MyClass)
  29. .filter(MyClass.somedata == "foo")
  30. .order_by(MyClass.sortkey)
  31. )
  32. # pickle the query
  33. serialized = dumps(query)
  34. # unpickle. Pass in metadata + scoped_session
  35. query2 = loads(serialized, metadata, Session)
  36. print(query2.all())
  37. Similar restrictions as when using raw pickle apply; mapped classes must be
  38. themselves be pickleable, meaning they are importable from a module-level
  39. namespace.
  40. The serializer module is only appropriate for query structures. It is not
  41. needed for:
  42. * instances of user-defined classes. These contain no references to engines,
  43. sessions or expression constructs in the typical case and can be serialized
  44. directly.
  45. * Table metadata that is to be loaded entirely from the serialized structure
  46. (i.e. is not already declared in the application). Regular
  47. pickle.loads()/dumps() can be used to fully dump any ``MetaData`` object,
  48. typically one which was reflected from an existing database at some previous
  49. point in time. The serializer module is specifically for the opposite case,
  50. where the Table metadata is already present in memory.
  51. """
  52. from io import BytesIO
  53. import pickle
  54. import re
  55. from .. import Column
  56. from .. import Table
  57. from ..engine import Engine
  58. from ..orm import class_mapper
  59. from ..orm.interfaces import MapperProperty
  60. from ..orm.mapper import Mapper
  61. from ..orm.session import Session
  62. from ..util import b64decode
  63. from ..util import b64encode
  64. __all__ = ["Serializer", "Deserializer", "dumps", "loads"]
  65. class Serializer(pickle.Pickler):
  66. def persistent_id(self, obj):
  67. # print "serializing:", repr(obj)
  68. if isinstance(obj, Mapper) and not obj.non_primary:
  69. id_ = "mapper:" + b64encode(pickle.dumps(obj.class_))
  70. elif isinstance(obj, MapperProperty) and not obj.parent.non_primary:
  71. id_ = (
  72. "mapperprop:"
  73. + b64encode(pickle.dumps(obj.parent.class_))
  74. + ":"
  75. + obj.key
  76. )
  77. elif isinstance(obj, Table):
  78. if "parententity" in obj._annotations:
  79. id_ = "mapper_selectable:" + b64encode(
  80. pickle.dumps(obj._annotations["parententity"].class_)
  81. )
  82. else:
  83. id_ = f"table:{obj.key}"
  84. elif isinstance(obj, Column) and isinstance(obj.table, Table):
  85. id_ = f"column:{obj.table.key}:{obj.key}"
  86. elif isinstance(obj, Session):
  87. id_ = "session:"
  88. elif isinstance(obj, Engine):
  89. id_ = "engine:"
  90. else:
  91. return None
  92. return id_
  93. our_ids = re.compile(
  94. r"(mapperprop|mapper|mapper_selectable|table|column|"
  95. r"session|attribute|engine):(.*)"
  96. )
  97. class Deserializer(pickle.Unpickler):
  98. def __init__(self, file, metadata=None, scoped_session=None, engine=None):
  99. super().__init__(file)
  100. self.metadata = metadata
  101. self.scoped_session = scoped_session
  102. self.engine = engine
  103. def get_engine(self):
  104. if self.engine:
  105. return self.engine
  106. elif self.scoped_session and self.scoped_session().bind:
  107. return self.scoped_session().bind
  108. else:
  109. return None
  110. def persistent_load(self, id_):
  111. m = our_ids.match(str(id_))
  112. if not m:
  113. return None
  114. else:
  115. type_, args = m.group(1, 2)
  116. if type_ == "attribute":
  117. key, clsarg = args.split(":")
  118. cls = pickle.loads(b64decode(clsarg))
  119. return getattr(cls, key)
  120. elif type_ == "mapper":
  121. cls = pickle.loads(b64decode(args))
  122. return class_mapper(cls)
  123. elif type_ == "mapper_selectable":
  124. cls = pickle.loads(b64decode(args))
  125. return class_mapper(cls).__clause_element__()
  126. elif type_ == "mapperprop":
  127. mapper, keyname = args.split(":")
  128. cls = pickle.loads(b64decode(mapper))
  129. return class_mapper(cls).attrs[keyname]
  130. elif type_ == "table":
  131. return self.metadata.tables[args]
  132. elif type_ == "column":
  133. table, colname = args.split(":")
  134. return self.metadata.tables[table].c[colname]
  135. elif type_ == "session":
  136. return self.scoped_session()
  137. elif type_ == "engine":
  138. return self.get_engine()
  139. else:
  140. raise Exception("Unknown token: %s" % type_)
  141. def dumps(obj, protocol=pickle.HIGHEST_PROTOCOL):
  142. buf = BytesIO()
  143. pickler = Serializer(buf, protocol)
  144. pickler.dump(obj)
  145. return buf.getvalue()
  146. def loads(data, metadata=None, scoped_session=None, engine=None):
  147. buf = BytesIO(data)
  148. unpickler = Deserializer(buf, metadata, scoped_session, engine)
  149. return unpickler.load()