node.hpp 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383
  1. /*************************************************************************
  2. *
  3. * Copyright 2018 Realm Inc.
  4. *
  5. * Licensed under the Apache License, Version 2.0 (the "License");
  6. * you may not use this file except in compliance with the License.
  7. * You may obtain a copy of the License at
  8. *
  9. * http://www.apache.org/licenses/LICENSE-2.0
  10. *
  11. * Unless required by applicable law or agreed to in writing, software
  12. * distributed under the License is distributed on an "AS IS" BASIS,
  13. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. * See the License for the specific language governing permissions and
  15. * limitations under the License.
  16. *
  17. **************************************************************************/
  18. #ifndef REALM_NODE_HPP
  19. #define REALM_NODE_HPP
  20. #include <realm/node_header.hpp>
  21. #include <realm/alloc.hpp>
  22. namespace realm {
  23. class Mixed;
  24. /// Special index value. It has various meanings depending on
  25. /// context. It is returned by some search functions to indicate 'not
  26. /// found'. It is similar in function to std::string::npos.
  27. const size_t npos = size_t(-1);
  28. /// Alias for realm::npos.
  29. const size_t not_found = npos;
  30. /// All accessor classes that logically contains other objects must inherit
  31. /// this class.
  32. ///
  33. /// A database node accessor contains information about the parent of the
  34. /// referenced node. This 'reverse' reference is not explicitly present in the
  35. /// underlying node hierarchy, but it is needed when modifying an array. A
  36. /// modification may lead to relocation of the underlying array node, and the
  37. /// parent must be updated accordingly. Since this applies recursivly all the
  38. /// way to the root node, it is essential that the entire chain of parent
  39. /// accessors is constructed and propperly maintained when a particular array is
  40. /// modified.
  41. class ArrayParent {
  42. public:
  43. virtual ~ArrayParent() noexcept {}
  44. virtual ref_type get_child_ref(size_t child_ndx) const noexcept = 0;
  45. virtual void update_child_ref(size_t child_ndx, ref_type new_ref) = 0;
  46. };
  47. /// Provides access to individual array nodes of the database.
  48. ///
  49. /// This class serves purely as an accessor, it assumes no ownership of the
  50. /// referenced memory.
  51. ///
  52. /// An node accessor can be in one of two states: attached or unattached. It is
  53. /// in the attached state if, and only if is_attached() returns true. Most
  54. /// non-static member functions of this class have undefined behaviour if the
  55. /// accessor is in the unattached state. The exceptions are: is_attached(),
  56. /// detach(), create(), init_from_ref(), init_from_mem(), init_from_parent(),
  57. /// has_parent(), get_parent(), set_parent(), get_ndx_in_parent(),
  58. /// set_ndx_in_parent(), adjust_ndx_in_parent(), and get_ref_from_parent().
  59. ///
  60. /// An node accessor contains information about the parent of the referenced
  61. /// node. This 'reverse' reference is not explicitly present in the
  62. /// underlying node hierarchy, but it is needed when modifying a node. A
  63. /// modification may lead to relocation of the underlying node, and the
  64. /// parent must be updated accordingly. Since this applies recursively all the
  65. /// way to the root node, it is essential that the entire chain of parent
  66. /// accessors is constructed and properly maintained when a particular node is
  67. /// modified.
  68. ///
  69. /// The parent reference (`pointer to parent`, `index in parent`) is updated
  70. /// independently from the state of attachment to an underlying node. In
  71. /// particular, the parent reference remains valid and is unaffected by changes
  72. /// in attachment. These two aspects of the state of the accessor is updated
  73. /// independently, and it is entirely the responsibility of the caller to update
  74. /// them such that they are consistent with the underlying node hierarchy before
  75. /// calling any method that modifies the underlying node.
  76. ///
  77. /// FIXME: This class currently has fragments of ownership, in particular the
  78. /// constructors that allocate underlying memory. On the other hand, the
  79. /// destructor never frees the memory. This is a problematic situation, because
  80. /// it so easily becomes an obscure source of leaks. There are three options for
  81. /// a fix of which the third is most attractive but hardest to implement: (1)
  82. /// Remove all traces of ownership semantics, that is, remove the constructors
  83. /// that allocate memory, but keep the trivial copy constructor. For this to
  84. /// work, it is important that the constness of the accessor has nothing to do
  85. /// with the constness of the underlying memory, otherwise constness can be
  86. /// violated simply by copying the accessor. (2) Disallov copying but associate
  87. /// the constness of the accessor with the constness of the underlying
  88. /// memory. (3) Provide full ownership semantics like is done for Table
  89. /// accessors, and provide a proper copy constructor that really produces a copy
  90. /// of the node. For this to work, the class should assume ownership if, and
  91. /// only if there is no parent. A copy produced by a copy constructor will not
  92. /// have a parent. Even if the original was part of a database, the copy will be
  93. /// free-standing, that is, not be part of any database. For intra, or inter
  94. /// database copying, one would have to also specify the target allocator.
  95. class Node : public NodeHeader {
  96. public:
  97. // FIXME: Should not be public
  98. char* m_data = nullptr; // Points to first byte after header
  99. /*********************** Constructor / destructor ************************/
  100. // The object will not be fully initialized when using this constructor
  101. explicit Node(Allocator& allocator) noexcept
  102. : m_alloc(allocator)
  103. {
  104. }
  105. virtual ~Node() {}
  106. /**************************** Initializers *******************************/
  107. /// Same as init_from_ref(ref_type) but avoid the mapping of 'ref' to memory
  108. /// pointer.
  109. char* init_from_mem(MemRef mem) noexcept
  110. {
  111. char* header = mem.get_addr();
  112. m_ref = mem.get_ref();
  113. m_data = get_data_from_header(header);
  114. m_size = get_size_from_header(header);
  115. return header;
  116. }
  117. /************************** access functions *****************************/
  118. bool is_attached() const noexcept
  119. {
  120. return m_data != nullptr;
  121. }
  122. inline bool is_read_only() const noexcept
  123. {
  124. REALM_ASSERT_DEBUG(is_attached());
  125. return m_alloc.is_read_only(m_ref);
  126. }
  127. size_t size() const noexcept
  128. {
  129. REALM_ASSERT_DEBUG(is_attached());
  130. return m_size;
  131. }
  132. bool is_empty() const noexcept
  133. {
  134. return size() == 0;
  135. }
  136. ref_type get_ref() const noexcept
  137. {
  138. return m_ref;
  139. }
  140. MemRef get_mem() const noexcept
  141. {
  142. return MemRef(get_header_from_data(m_data), m_ref, m_alloc);
  143. }
  144. Allocator& get_alloc() const noexcept
  145. {
  146. return m_alloc;
  147. }
  148. /// Get the address of the header of this array.
  149. char* get_header() const noexcept
  150. {
  151. return get_header_from_data(m_data);
  152. }
  153. bool has_parent() const noexcept
  154. {
  155. return m_parent != nullptr;
  156. }
  157. ArrayParent* get_parent() const noexcept
  158. {
  159. return m_parent;
  160. }
  161. size_t get_ndx_in_parent() const noexcept
  162. {
  163. return m_ndx_in_parent;
  164. }
  165. bool has_missing_parent_update() const noexcept
  166. {
  167. return m_missing_parent_update;
  168. }
  169. /// Get the ref of this array as known to the parent. The caller must ensure
  170. /// that the parent information ('pointer to parent' and 'index in parent')
  171. /// is correct before calling this function.
  172. ref_type get_ref_from_parent() const noexcept
  173. {
  174. REALM_ASSERT_DEBUG(m_parent);
  175. ref_type ref = m_parent->get_child_ref(m_ndx_in_parent);
  176. return ref;
  177. }
  178. /***************************** modifiers *********************************/
  179. /// Detach from the underlying array node. This method has no effect if the
  180. /// accessor is currently unattached (idempotency).
  181. void detach() noexcept
  182. {
  183. m_data = nullptr;
  184. }
  185. /// Destroy only the array that this accessor is attached to, not the
  186. /// children of that array. See non-static destroy_deep() for an
  187. /// alternative. If this accessor is already in the detached state, this
  188. /// function has no effect (idempotency).
  189. void destroy() noexcept
  190. {
  191. if (!is_attached())
  192. return;
  193. char* header = get_header_from_data(m_data);
  194. m_alloc.free_(m_ref, header);
  195. m_data = nullptr;
  196. }
  197. /// Shorthand for `destroy(MemRef(ref, alloc), alloc)`.
  198. static void destroy(ref_type ref, Allocator& alloc) noexcept
  199. {
  200. destroy(MemRef(ref, alloc), alloc);
  201. }
  202. /// Destroy only the specified array node, not its children. See also
  203. /// destroy_deep(MemRef, Allocator&).
  204. static void destroy(MemRef mem, Allocator& alloc) noexcept
  205. {
  206. alloc.free_(mem);
  207. }
  208. /// Setting a new parent affects ownership of the attached array node, if
  209. /// any. If a non-null parent is specified, and there was no parent
  210. /// originally, then the caller passes ownership to the parent, and vice
  211. /// versa. This assumes, of course, that the change in parentship reflects a
  212. /// corresponding change in the list of children in the affected parents.
  213. void set_parent(ArrayParent* parent, size_t ndx_in_parent) noexcept
  214. {
  215. m_parent = parent;
  216. m_ndx_in_parent = ndx_in_parent;
  217. }
  218. void set_ndx_in_parent(size_t ndx) noexcept
  219. {
  220. m_ndx_in_parent = ndx;
  221. }
  222. void clear_missing_parent_update()
  223. {
  224. m_missing_parent_update = false;
  225. }
  226. /// Update the parents reference to this child. This requires, of course,
  227. /// that the parent information stored in this child is up to date. If the
  228. /// parent pointer is set to null, this function has no effect.
  229. void update_parent()
  230. {
  231. if (m_parent) {
  232. m_parent->update_child_ref(m_ndx_in_parent, m_ref);
  233. }
  234. else {
  235. m_missing_parent_update = true;
  236. }
  237. }
  238. protected:
  239. /// The total size in bytes (including the header) of a new empty
  240. /// array. Must be a multiple of 8 (i.e., 64-bit aligned).
  241. static const size_t initial_capacity = 128;
  242. size_t m_ref;
  243. Allocator& m_alloc;
  244. size_t m_size = 0; // Number of elements currently stored.
  245. #if REALM_ENABLE_MEMDEBUG
  246. // If m_no_relocation is false, then copy_on_write() will always relocate this array, regardless if it's
  247. // required or not. If it's true, then it will never relocate, which is currently only expeted inside
  248. // GroupWriter::write_group() due to a unique chicken/egg problem (see description there).
  249. bool m_no_relocation = false;
  250. #endif
  251. void alloc(size_t init_size, size_t new_width);
  252. void copy_on_write()
  253. {
  254. #if REALM_ENABLE_MEMDEBUG
  255. // We want to relocate this array regardless if there is a need or not, in order to catch use-after-free bugs.
  256. // Only exception is inside GroupWriter::write_group() (see explanation at the definition of the
  257. // m_no_relocation
  258. // member)
  259. if (!m_no_relocation) {
  260. #else
  261. if (is_read_only()) {
  262. #endif
  263. do_copy_on_write();
  264. }
  265. }
  266. void copy_on_write(size_t min_size)
  267. {
  268. #if REALM_ENABLE_MEMDEBUG
  269. // We want to relocate this array regardless if there is a need or not, in order to catch use-after-free bugs.
  270. // Only exception is inside GroupWriter::write_group() (see explanation at the definition of the
  271. // m_no_relocation
  272. // member)
  273. if (!m_no_relocation) {
  274. #else
  275. if (is_read_only()) {
  276. #endif
  277. do_copy_on_write(min_size);
  278. }
  279. }
  280. void ensure_size(size_t min_size)
  281. {
  282. char* header = get_header_from_data(m_data);
  283. size_t orig_capacity_bytes = get_capacity_from_header(header);
  284. if (orig_capacity_bytes < min_size) {
  285. do_copy_on_write(min_size);
  286. }
  287. }
  288. static MemRef create_node(size_t size, Allocator& alloc, bool context_flag = false, Type type = type_Normal,
  289. WidthType width_type = wtype_Ignore, int width = 1);
  290. void set_header_size(size_t value) noexcept
  291. {
  292. set_size_in_header(value, get_header());
  293. }
  294. // Includes array header. Not necessarily 8-byte aligned.
  295. virtual size_t calc_byte_len(size_t num_items, size_t width) const;
  296. virtual size_t calc_item_count(size_t bytes, size_t width) const noexcept;
  297. static void init_header(char* header, bool is_inner_bptree_node, bool has_refs, bool context_flag,
  298. WidthType width_type, int width, size_t size, size_t capacity) noexcept;
  299. private:
  300. friend class NodeTree;
  301. ArrayParent* m_parent = nullptr;
  302. size_t m_ndx_in_parent = 0; // Ignored if m_parent is null.
  303. bool m_missing_parent_update = false;
  304. void do_copy_on_write(size_t minimum_size = 0);
  305. };
  306. class Spec;
  307. class Mixed;
  308. /// Base class for all nodes holding user data
  309. class ArrayPayload {
  310. public:
  311. virtual ~ArrayPayload();
  312. virtual void init_from_ref(ref_type) noexcept = 0;
  313. virtual void set_parent(ArrayParent* parent, size_t ndx_in_parent) noexcept = 0;
  314. virtual Mixed get_any(size_t ndx) const = 0;
  315. virtual bool need_spec() const
  316. {
  317. return false;
  318. }
  319. virtual void set_spec(Spec*, size_t) const {}
  320. };
  321. inline void Node::init_header(char* header, bool is_inner_bptree_node, bool has_refs, bool context_flag,
  322. WidthType width_type, int width, size_t size, size_t capacity) noexcept
  323. {
  324. // Note: Since the header layout contains unallocated bit and/or
  325. // bytes, it is important that we put the entire header into a
  326. // well defined state initially.
  327. std::fill(header, header + header_size, 0);
  328. set_is_inner_bptree_node_in_header(is_inner_bptree_node, header);
  329. set_hasrefs_in_header(has_refs, header);
  330. set_context_flag_in_header(context_flag, header);
  331. set_wtype_in_header(width_type, header);
  332. set_width_in_header(width, header);
  333. set_size_in_header(size, header);
  334. set_capacity_in_header(capacity, header);
  335. }
  336. } // namespace realm
  337. #endif /* REALM_NODE_HPP */