collection.hpp 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667
  1. #ifndef REALM_COLLECTION_HPP
  2. #define REALM_COLLECTION_HPP
  3. #include <realm/obj.hpp>
  4. #include <realm/bplustree.hpp>
  5. #include <realm/obj_list.hpp>
  6. #include <realm/table.hpp>
  7. #include <iosfwd> // std::ostream
  8. #include <type_traits> // std::void_t
  9. namespace realm {
  10. template <class L>
  11. struct CollectionIterator;
  12. class CollectionBase {
  13. public:
  14. virtual ~CollectionBase() {}
  15. /// The size of the collection.
  16. virtual size_t size() const = 0;
  17. /// True if the element at @a ndx is NULL.
  18. virtual bool is_null(size_t ndx) const = 0;
  19. /// Get element at @a ndx as a `Mixed`.
  20. virtual Mixed get_any(size_t ndx) const = 0;
  21. /// Clear the collection.
  22. virtual void clear() = 0;
  23. /// Get the min element, according to whatever comparison function is
  24. /// meaningful for the collection, or none if min is not supported for this type.
  25. virtual util::Optional<Mixed> min(size_t* return_ndx = nullptr) const = 0;
  26. /// Get the max element, according to whatever comparison function is
  27. /// meaningful for the collection, or none if max is not supported for this type.
  28. virtual util::Optional<Mixed> max(size_t* return_ndx = nullptr) const = 0;
  29. /// For collections of arithmetic types, return the sum of all elements.
  30. /// For non arithmetic types, returns none.
  31. virtual util::Optional<Mixed> sum(size_t* return_cnt = nullptr) const = 0;
  32. /// For collections of arithmetic types, return the average of all elements.
  33. /// For non arithmetic types, returns none.
  34. virtual util::Optional<Mixed> avg(size_t* return_cnt = nullptr) const = 0;
  35. /// Produce a clone of the collection accessor referring to the same
  36. /// underlying memory.
  37. virtual std::unique_ptr<CollectionBase> clone_collection() const = 0;
  38. /// Modifies a vector of indices so that they refer to values sorted
  39. /// according to the specified sort order.
  40. virtual void sort(std::vector<size_t>& indices, bool ascending = true) const = 0;
  41. /// Modifies a vector of indices so that they refer to distinct values. If
  42. /// @a sort_order is supplied, the indices will refer to values in sort
  43. /// order, otherwise the indices will be in the same order as they appear in
  44. /// the collection.
  45. virtual void distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order = util::none) const = 0;
  46. // Return index of the first occurrence of 'value'
  47. virtual size_t find_any(Mixed value) const = 0;
  48. /// True if `size()` returns 0.
  49. virtual bool is_empty() const final
  50. {
  51. return size() == 0;
  52. }
  53. /// Get the object that owns this collection.
  54. virtual const Obj& get_obj() const noexcept = 0;
  55. /// Get the column key for this collection.
  56. virtual ColKey get_col_key() const noexcept = 0;
  57. /// Return true if the collection has changed since the last call to
  58. /// `has_changed()`. Note that this function is not idempotent and updates
  59. /// the internal state of the accessor if it has changed.
  60. virtual bool has_changed() const = 0;
  61. /// Returns true if the accessor is in the attached state. By default, this
  62. /// checks if the owning object is still valid.
  63. virtual bool is_attached() const
  64. {
  65. return get_obj().is_valid();
  66. }
  67. // Note: virtual..final prevents static override.
  68. /// Get the key of the object that owns this collection.
  69. virtual ObjKey get_owner_key() const noexcept final
  70. {
  71. return get_obj().get_key();
  72. }
  73. /// Get the table of the object that owns this collection.
  74. virtual ConstTableRef get_table() const noexcept final
  75. {
  76. return get_obj().get_table();
  77. }
  78. /// If this is a collection of links, get the target table.
  79. virtual TableRef get_target_table() const final
  80. {
  81. return get_obj().get_target_table(get_col_key());
  82. }
  83. protected:
  84. friend class Transaction;
  85. CollectionBase() noexcept = default;
  86. CollectionBase(const CollectionBase&) noexcept = default;
  87. CollectionBase(CollectionBase&&) noexcept = default;
  88. CollectionBase& operator=(const CollectionBase&) noexcept = default;
  89. CollectionBase& operator=(CollectionBase&&) noexcept = default;
  90. /// Unconditionally (re)initialize this accessor from its parent (the owner
  91. /// object). May leave the collection detached if the object is no longer
  92. /// valid. Return true if the accessor is attached.
  93. virtual bool init_from_parent() const = 0;
  94. /// If the underlying memory has changed, update this accessor to reflect
  95. /// the new state. Returns true if the accessor was actually updated.
  96. virtual bool update_if_needed() const = 0;
  97. };
  98. template <class T>
  99. inline void check_column_type(ColKey col)
  100. {
  101. if (col && col.get_type() != ColumnTypeTraits<T>::column_id) {
  102. throw LogicError(LogicError::collection_type_mismatch);
  103. }
  104. }
  105. template <>
  106. inline void check_column_type<Int>(ColKey col)
  107. {
  108. if (col && (col.get_type() != col_type_Int || col.get_attrs().test(col_attr_Nullable))) {
  109. throw LogicError(LogicError::collection_type_mismatch);
  110. }
  111. }
  112. template <>
  113. inline void check_column_type<util::Optional<Int>>(ColKey col)
  114. {
  115. if (col && (col.get_type() != col_type_Int || !col.get_attrs().test(col_attr_Nullable))) {
  116. throw LogicError(LogicError::collection_type_mismatch);
  117. }
  118. }
  119. template <>
  120. inline void check_column_type<ObjKey>(ColKey col)
  121. {
  122. if (col) {
  123. bool is_link_list = (col.get_type() == col_type_LinkList);
  124. bool is_link_set = (col.is_set() && col.get_type() == col_type_Link);
  125. if (!(is_link_list || is_link_set))
  126. throw LogicError(LogicError::collection_type_mismatch);
  127. }
  128. }
  129. template <class T, class = void>
  130. struct MinHelper {
  131. template <class U>
  132. static util::Optional<Mixed> eval(U&, size_t*) noexcept
  133. {
  134. return util::none;
  135. }
  136. };
  137. template <class T>
  138. struct MinHelper<T, std::void_t<ColumnMinMaxType<T>>> {
  139. template <class U>
  140. static util::Optional<Mixed> eval(U& tree, size_t* return_ndx)
  141. {
  142. auto optional_min = bptree_minimum<T>(tree, return_ndx);
  143. if (optional_min) {
  144. return Mixed{*optional_min};
  145. }
  146. return Mixed{};
  147. }
  148. };
  149. template <class T, class Enable = void>
  150. struct MaxHelper {
  151. template <class U>
  152. static util::Optional<Mixed> eval(U&, size_t*) noexcept
  153. {
  154. return util::none;
  155. }
  156. };
  157. template <class T>
  158. struct MaxHelper<T, std::void_t<ColumnMinMaxType<T>>> {
  159. template <class U>
  160. static util::Optional<Mixed> eval(U& tree, size_t* return_ndx)
  161. {
  162. auto optional_max = bptree_maximum<T>(tree, return_ndx);
  163. if (optional_max) {
  164. return Mixed{*optional_max};
  165. }
  166. return Mixed{};
  167. }
  168. };
  169. template <class T, class Enable = void>
  170. class SumHelper {
  171. public:
  172. template <class U>
  173. static util::Optional<Mixed> eval(U&, size_t* return_cnt) noexcept
  174. {
  175. if (return_cnt)
  176. *return_cnt = 0;
  177. return util::none;
  178. }
  179. };
  180. template <class T>
  181. class SumHelper<T, std::void_t<ColumnSumType<T>>> {
  182. public:
  183. template <class U>
  184. static util::Optional<Mixed> eval(U& tree, size_t* return_cnt)
  185. {
  186. return Mixed{bptree_sum<T>(tree, return_cnt)};
  187. }
  188. };
  189. template <class T, class = void>
  190. struct AverageHelper {
  191. template <class U>
  192. static util::Optional<Mixed> eval(U&, size_t* return_cnt) noexcept
  193. {
  194. if (return_cnt)
  195. *return_cnt = 0;
  196. return util::none;
  197. }
  198. };
  199. template <class T>
  200. struct AverageHelper<T, std::void_t<ColumnSumType<T>>> {
  201. template <class U>
  202. static util::Optional<Mixed> eval(U& tree, size_t* return_cnt)
  203. {
  204. size_t count = 0;
  205. auto result = Mixed{bptree_average<T>(tree, &count)};
  206. if (return_cnt) {
  207. *return_cnt = count;
  208. }
  209. return count == 0 ? util::none : result;
  210. }
  211. };
  212. /// Convenience base class for collections, which implements most of the
  213. /// relevant interfaces for a collection that is bound to an object accessor and
  214. /// representable as a BPlusTree<T>.
  215. template <class Interface>
  216. class CollectionBaseImpl : public Interface, protected ArrayParent {
  217. public:
  218. static_assert(std::is_base_of_v<CollectionBase, Interface>);
  219. // Overriding members of CollectionBase:
  220. ColKey get_col_key() const noexcept final
  221. {
  222. return m_col_key;
  223. }
  224. const Obj& get_obj() const noexcept final
  225. {
  226. return m_obj;
  227. }
  228. bool has_changed() const final
  229. {
  230. update_if_needed();
  231. if (m_last_content_version != m_content_version) {
  232. m_last_content_version = m_content_version;
  233. return true;
  234. }
  235. return false;
  236. }
  237. using Interface::get_owner_key;
  238. using Interface::get_table;
  239. using Interface::get_target_table;
  240. protected:
  241. Obj m_obj;
  242. ColKey m_col_key;
  243. bool m_nullable = false;
  244. mutable uint_fast64_t m_content_version = 0;
  245. mutable uint_fast64_t m_last_content_version = 0;
  246. mutable bool m_valid = false;
  247. CollectionBaseImpl() = default;
  248. CollectionBaseImpl(const CollectionBaseImpl& other) = default;
  249. CollectionBaseImpl(CollectionBaseImpl&& other) = default;
  250. CollectionBaseImpl(const Obj& obj, ColKey col_key) noexcept
  251. : m_obj(obj)
  252. , m_col_key(col_key)
  253. , m_nullable(col_key.is_nullable())
  254. {
  255. }
  256. CollectionBaseImpl& operator=(const CollectionBaseImpl& other) = default;
  257. CollectionBaseImpl& operator=(CollectionBaseImpl&& other) = default;
  258. bool operator==(const CollectionBaseImpl& other) const noexcept
  259. {
  260. return get_table() == other.get_table() && get_owner_key() == other.get_owner_key() &&
  261. get_col_key() == other.get_col_key();
  262. }
  263. bool operator!=(const CollectionBaseImpl& other) const noexcept
  264. {
  265. return !(*this == other);
  266. }
  267. // Overriding members of CollectionBase:
  268. REALM_NOINLINE bool update_if_needed() const final
  269. {
  270. if (!m_obj.is_valid())
  271. return false;
  272. auto content_version = m_obj.get_alloc().get_content_version();
  273. if (m_obj.update_if_needed() || content_version != m_content_version) {
  274. this->init_from_parent();
  275. return true;
  276. }
  277. return false;
  278. }
  279. void update_content_version() const noexcept
  280. {
  281. m_content_version = m_obj.get_alloc().get_content_version();
  282. }
  283. void bump_content_version()
  284. {
  285. m_content_version = m_obj.bump_content_version();
  286. }
  287. void ensure_writeable()
  288. {
  289. if (m_obj.ensure_writeable()) {
  290. this->init_from_parent();
  291. }
  292. }
  293. protected:
  294. // Overriding ArrayParent interface:
  295. ref_type get_child_ref(size_t child_ndx) const noexcept final
  296. {
  297. static_cast<void>(child_ndx);
  298. try {
  299. return to_ref(m_obj._get<int64_t>(m_col_key.get_index()));
  300. }
  301. catch (const KeyNotFound&) {
  302. return ref_type(0);
  303. }
  304. }
  305. void update_child_ref(size_t child_ndx, ref_type new_ref) final
  306. {
  307. static_cast<void>(child_ndx);
  308. m_obj.set_int(m_col_key, from_ref(new_ref));
  309. }
  310. };
  311. namespace _impl {
  312. /// Translate from condensed index to uncondensed index in collections that hide
  313. /// tombstones.
  314. size_t virtual2real(const std::vector<size_t>& vec, size_t ndx) noexcept;
  315. /// Translate from uncondensed index to condensed into in collections that hide
  316. /// tombstones.
  317. size_t real2virtual(const std::vector<size_t>& vec, size_t ndx) noexcept;
  318. /// Rebuild the list of unresolved keys for tombstone handling.
  319. void update_unresolved(std::vector<size_t>& vec, const BPlusTree<ObjKey>* tree);
  320. /// Clear the context flag on the tree if there are no more unresolved links.
  321. void check_for_last_unresolved(BPlusTree<ObjKey>* tree);
  322. /// Proxy class needed because the ObjList interface clobbers method names from
  323. /// CollectionBase.
  324. struct ObjListProxy : ObjList {
  325. virtual TableRef proxy_get_target_table() const = 0;
  326. TableRef get_target_table() const final
  327. {
  328. return proxy_get_target_table();
  329. }
  330. };
  331. } // namespace _impl
  332. /// Base class for collections of objects, where unresolved links (tombstones)
  333. /// can occur.
  334. template <class Interface>
  335. class ObjCollectionBase : public Interface, public _impl::ObjListProxy {
  336. public:
  337. static_assert(std::is_base_of_v<CollectionBase, Interface>);
  338. using Interface::get_col_key;
  339. using Interface::get_obj;
  340. using Interface::get_table;
  341. using Interface::is_attached;
  342. using Interface::size;
  343. // Overriding methods in ObjList:
  344. void get_dependencies(TableVersions& versions) const final
  345. {
  346. if (is_attached()) {
  347. auto table = this->get_table();
  348. versions.emplace_back(table->get_key(), table->get_content_version());
  349. }
  350. }
  351. void sync_if_needed() const final
  352. {
  353. if (is_attached()) {
  354. update_if_needed();
  355. }
  356. }
  357. bool is_in_sync() const noexcept final
  358. {
  359. return true;
  360. }
  361. bool has_unresolved() const noexcept
  362. {
  363. return m_unresolved.size() != 0;
  364. }
  365. using Interface::get_target_table;
  366. protected:
  367. ObjCollectionBase() = default;
  368. ObjCollectionBase(const ObjCollectionBase&) = default;
  369. ObjCollectionBase(ObjCollectionBase&&) = default;
  370. ObjCollectionBase& operator=(const ObjCollectionBase&) = default;
  371. ObjCollectionBase& operator=(ObjCollectionBase&&) = default;
  372. /// Implementations should call `update_if_needed()` on their inner accessor
  373. /// (without `update_unresolved()`).
  374. virtual bool do_update_if_needed() const = 0;
  375. /// Implementations should call `init_from_parent()` on their inner accessor
  376. /// (without `update_unresolved()`).
  377. virtual bool do_init_from_parent() const = 0;
  378. /// Implementations should return a non-const reference to their internal
  379. /// `BPlusTree<T>`.
  380. virtual BPlusTree<ObjKey>* get_mutable_tree() const = 0;
  381. /// Calls `do_init_from_parent()` and updates the list of unresolved links.
  382. bool init_from_parent() const final
  383. {
  384. clear_unresolved();
  385. bool valid = do_init_from_parent();
  386. if (valid) {
  387. update_unresolved();
  388. }
  389. return valid;
  390. }
  391. /// Implements update_if_needed() in a way that ensures the consistency of
  392. /// the unresolved list. Derived classes should call this instead of calling
  393. /// `update_if_needed()` on their inner accessor.
  394. bool update_if_needed() const final
  395. {
  396. bool updated = do_update_if_needed();
  397. update_unresolved();
  398. return updated;
  399. }
  400. /// Translate from condensed index to uncondensed.
  401. size_t virtual2real(size_t ndx) const noexcept
  402. {
  403. return _impl::virtual2real(m_unresolved, ndx);
  404. }
  405. /// Translate from uncondensed index to condensed.
  406. size_t real2virtual(size_t ndx) const noexcept
  407. {
  408. return _impl::real2virtual(m_unresolved, ndx);
  409. }
  410. /// Rebuild the list of tombstones if there is a chance that it has changed.
  411. void update_unresolved() const
  412. {
  413. const auto& obj = this->get_obj();
  414. if (obj.is_valid()) {
  415. auto content_version = this->get_obj().get_alloc().get_content_version();
  416. if (content_version != m_content_version) {
  417. _impl::update_unresolved(m_unresolved, get_mutable_tree());
  418. m_content_version = content_version;
  419. }
  420. }
  421. else {
  422. clear_unresolved();
  423. }
  424. }
  425. void check_for_last_unresolved()
  426. {
  427. _impl::check_for_last_unresolved(get_mutable_tree());
  428. }
  429. /// Clear the list of tombstones. It will be rebuilt the next time
  430. /// `update_if_needed()` is called.
  431. void clear_unresolved() const noexcept
  432. {
  433. m_unresolved.clear();
  434. m_content_version = uint_fast64_t(-1);
  435. }
  436. /// Return the number of tombstones.
  437. size_t num_unresolved() const noexcept
  438. {
  439. return m_unresolved.size();
  440. }
  441. private:
  442. // Sorted set of indices containing unresolved links.
  443. mutable std::vector<size_t> m_unresolved;
  444. // We need to track the content version separately to keep the list of
  445. // unresolved indices up to date, and can't rely on the return value of
  446. // `do_update_if_needed()`, because the inner accessor may have been
  447. // refreshed without our knowledge.
  448. mutable uint_fast64_t m_content_version = uint_fast64_t(-1);
  449. TableRef proxy_get_target_table() const final
  450. {
  451. return Interface::get_target_table();
  452. }
  453. bool matches(const ObjList& other) const final
  454. {
  455. return get_owning_obj().get_key() == other.get_owning_obj().get_key() &&
  456. get_owning_col_key() == other.get_owning_col_key();
  457. }
  458. Obj get_owning_obj() const final
  459. {
  460. return get_obj();
  461. }
  462. ColKey get_owning_col_key() const final
  463. {
  464. return get_col_key();
  465. }
  466. };
  467. /// Random-access iterator over elements of a collection.
  468. ///
  469. /// Values are cached into a member variable in order to support `operator->`
  470. /// and `operator*` returning a pointer and a reference, respectively.
  471. template <class L>
  472. struct CollectionIterator {
  473. using iterator_category = std::random_access_iterator_tag;
  474. using value_type = typename L::value_type;
  475. using difference_type = ptrdiff_t;
  476. using pointer = const value_type*;
  477. using reference = const value_type&;
  478. CollectionIterator(const L* l, size_t ndx) noexcept
  479. : m_list(l)
  480. , m_ndx(ndx)
  481. {
  482. }
  483. pointer operator->() const
  484. {
  485. m_val = m_list->get(m_ndx);
  486. return &m_val;
  487. }
  488. reference operator*() const
  489. {
  490. return *operator->();
  491. }
  492. CollectionIterator& operator++() noexcept
  493. {
  494. ++m_ndx;
  495. return *this;
  496. }
  497. CollectionIterator operator++(int) noexcept
  498. {
  499. auto tmp = *this;
  500. operator++();
  501. return tmp;
  502. }
  503. CollectionIterator& operator--() noexcept
  504. {
  505. --m_ndx;
  506. return *this;
  507. }
  508. CollectionIterator operator--(int) noexcept
  509. {
  510. auto tmp = *this;
  511. operator--();
  512. return tmp;
  513. }
  514. CollectionIterator& operator+=(ptrdiff_t n) noexcept
  515. {
  516. m_ndx += n;
  517. return *this;
  518. }
  519. CollectionIterator& operator-=(ptrdiff_t n) noexcept
  520. {
  521. m_ndx -= n;
  522. return *this;
  523. }
  524. friend ptrdiff_t operator-(const CollectionIterator& lhs, const CollectionIterator& rhs) noexcept
  525. {
  526. return ptrdiff_t(lhs.m_ndx) - ptrdiff_t(rhs.m_ndx);
  527. }
  528. friend CollectionIterator operator+(CollectionIterator lhs, ptrdiff_t rhs) noexcept
  529. {
  530. lhs.m_ndx += rhs;
  531. return lhs;
  532. }
  533. friend CollectionIterator operator+(ptrdiff_t lhs, CollectionIterator rhs) noexcept
  534. {
  535. return rhs + lhs;
  536. }
  537. bool operator!=(const CollectionIterator& rhs) const noexcept
  538. {
  539. REALM_ASSERT_DEBUG(m_list == rhs.m_list);
  540. return m_ndx != rhs.m_ndx;
  541. }
  542. bool operator==(const CollectionIterator& rhs) const noexcept
  543. {
  544. REALM_ASSERT_DEBUG(m_list == rhs.m_list);
  545. return m_ndx == rhs.m_ndx;
  546. }
  547. size_t index() const noexcept
  548. {
  549. return m_ndx;
  550. }
  551. private:
  552. mutable value_type m_val;
  553. const L* m_list;
  554. size_t m_ndx = size_t(-1);
  555. };
  556. } // namespace realm
  557. #endif // REALM_COLLECTION_HPP