set.hpp 37 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317
  1. /*************************************************************************
  2. *
  3. * Copyright 2020 Realm Inc.
  4. *
  5. * Licensed under the Apache License, Version 2.0 (the "License");
  6. * you may not use this file except in compliance with the License.
  7. * You may obtain a copy of the License at
  8. *
  9. * http://www.apache.org/licenses/LICENSE-2.0
  10. *
  11. * Unless required by applicable law or agreed to in writing, software
  12. * distributed under the License is distributed on an "AS IS" BASIS,
  13. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. * See the License for the specific language governing permissions and
  15. * limitations under the License.
  16. *
  17. **************************************************************************/
  18. #ifndef REALM_SET_HPP
  19. #define REALM_SET_HPP
  20. #include <realm/collection.hpp>
  21. #include <realm/bplustree.hpp>
  22. #include <realm/array_key.hpp>
  23. #include <numeric> // std::iota
  24. namespace realm {
  25. class SetBase : public CollectionBase {
  26. public:
  27. using CollectionBase::CollectionBase;
  28. virtual ~SetBase() {}
  29. virtual SetBasePtr clone() const = 0;
  30. virtual std::pair<size_t, bool> insert_null() = 0;
  31. virtual std::pair<size_t, bool> erase_null() = 0;
  32. virtual std::pair<size_t, bool> insert_any(Mixed value) = 0;
  33. virtual std::pair<size_t, bool> erase_any(Mixed value) = 0;
  34. protected:
  35. void insert_repl(Replication* repl, size_t index, Mixed value) const;
  36. void erase_repl(Replication* repl, size_t index, Mixed value) const;
  37. void clear_repl(Replication* repl) const;
  38. static std::vector<Mixed> convert_to_mixed_set(const CollectionBase& rhs);
  39. };
  40. template <class T>
  41. class Set final : public CollectionBaseImpl<SetBase, Set<T>> {
  42. public:
  43. using Base = CollectionBaseImpl<SetBase, Set>;
  44. using value_type = T;
  45. using iterator = CollectionIterator<Set<T>>;
  46. Set() = default;
  47. Set(const Obj& owner, ColKey col_key);
  48. Set(const Set& other);
  49. Set(Set&& other) noexcept;
  50. Set& operator=(const Set& other);
  51. Set& operator=(Set&& other) noexcept;
  52. using Base::operator==;
  53. using Base::operator!=;
  54. SetBasePtr clone() const final
  55. {
  56. return std::make_unique<Set<T>>(*this);
  57. }
  58. T get(size_t ndx) const
  59. {
  60. const auto current_size = size();
  61. CollectionBase::validate_index("get()", ndx, current_size);
  62. return m_tree->get(ndx);
  63. }
  64. iterator begin() const noexcept
  65. {
  66. return iterator{this, 0};
  67. }
  68. iterator end() const noexcept
  69. {
  70. return iterator{this, size()};
  71. }
  72. size_t find_first(const T& value) const
  73. {
  74. return find(value);
  75. }
  76. template <class Func>
  77. void find_all(T value, Func&& func) const
  78. {
  79. size_t found = find(value);
  80. if (found != not_found) {
  81. func(found);
  82. }
  83. }
  84. bool is_subset_of(const CollectionBase&) const;
  85. bool is_strict_subset_of(const CollectionBase& rhs) const;
  86. bool is_superset_of(const CollectionBase& rhs) const;
  87. bool is_strict_superset_of(const CollectionBase& rhs) const;
  88. bool intersects(const CollectionBase& rhs) const;
  89. bool set_equals(const CollectionBase& rhs) const;
  90. void assign_union(const CollectionBase&);
  91. void assign_intersection(const CollectionBase&);
  92. void assign_difference(const CollectionBase&);
  93. void assign_symmetric_difference(const CollectionBase&);
  94. /// Insert a value into the set if it does not already exist, returning the index of the inserted value,
  95. /// or the index of the already-existing value.
  96. std::pair<size_t, bool> insert(T value);
  97. /// Find the index of a value in the set, or `size_t(-1)` if it is not in the set.
  98. size_t find(T value) const;
  99. /// Erase an element from the set, returning true if the set contained the element.
  100. std::pair<size_t, bool> erase(T value);
  101. // Overriding members of CollectionBase:
  102. size_t size() const final;
  103. bool is_null(size_t ndx) const final;
  104. Mixed get_any(size_t ndx) const final
  105. {
  106. return get(ndx);
  107. }
  108. void clear() final;
  109. util::Optional<Mixed> min(size_t* return_ndx = nullptr) const final;
  110. util::Optional<Mixed> max(size_t* return_ndx = nullptr) const final;
  111. util::Optional<Mixed> sum(size_t* return_cnt = nullptr) const final;
  112. util::Optional<Mixed> avg(size_t* return_cnt = nullptr) const final;
  113. std::unique_ptr<CollectionBase> clone_collection() const final
  114. {
  115. return std::make_unique<Set<T>>(*this);
  116. }
  117. void sort(std::vector<size_t>& indices, bool ascending = true) const final;
  118. void distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order = util::none) const final;
  119. // Overriding members of SetBase:
  120. size_t find_any(Mixed) const final;
  121. std::pair<size_t, bool> insert_null() final;
  122. std::pair<size_t, bool> erase_null() final;
  123. std::pair<size_t, bool> insert_any(Mixed value) final;
  124. std::pair<size_t, bool> erase_any(Mixed value) final;
  125. const BPlusTree<T>& get_tree() const
  126. {
  127. return *m_tree;
  128. }
  129. UpdateStatus update_if_needed() const final
  130. {
  131. auto status = Base::update_if_needed();
  132. switch (status) {
  133. case UpdateStatus::Detached: {
  134. m_tree.reset();
  135. return UpdateStatus::Detached;
  136. }
  137. case UpdateStatus::NoChange:
  138. if (m_tree && m_tree->is_attached()) {
  139. return UpdateStatus::NoChange;
  140. }
  141. // The tree has not been initialized yet for this accessor, so
  142. // perform lazy initialization by treating it as an update.
  143. [[fallthrough]];
  144. case UpdateStatus::Updated: {
  145. bool attached = init_from_parent(false);
  146. return attached ? UpdateStatus::Updated : UpdateStatus::Detached;
  147. }
  148. }
  149. REALM_UNREACHABLE();
  150. }
  151. UpdateStatus ensure_created() final
  152. {
  153. auto status = Base::ensure_created();
  154. switch (status) {
  155. case UpdateStatus::Detached:
  156. break; // Not possible (would have thrown earlier).
  157. case UpdateStatus::NoChange: {
  158. if (m_tree && m_tree->is_attached()) {
  159. return UpdateStatus::NoChange;
  160. }
  161. // The tree has not been initialized yet for this accessor, so
  162. // perform lazy initialization by treating it as an update.
  163. [[fallthrough]];
  164. }
  165. case UpdateStatus::Updated: {
  166. bool attached = init_from_parent(true);
  167. REALM_ASSERT(attached);
  168. return attached ? UpdateStatus::Updated : UpdateStatus::Detached;
  169. }
  170. }
  171. REALM_UNREACHABLE();
  172. }
  173. void migrate();
  174. private:
  175. // Friend because it needs access to `m_tree` in the implementation of
  176. // `ObjCollectionBase::get_mutable_tree()`.
  177. friend class LnkSet;
  178. // BPlusTree must be wrapped in an `std::unique_ptr` because it is not
  179. // default-constructible, due to its `Allocator&` member.
  180. mutable std::unique_ptr<BPlusTree<T>> m_tree;
  181. using Base::bump_content_version;
  182. using Base::m_col_key;
  183. using Base::m_nullable;
  184. using Base::m_obj;
  185. bool init_from_parent(bool allow_create) const
  186. {
  187. if (!m_tree) {
  188. m_tree.reset(new BPlusTree<T>(m_obj.get_alloc()));
  189. const ArrayParent* parent = this;
  190. m_tree->set_parent(const_cast<ArrayParent*>(parent), 0);
  191. }
  192. if (m_tree->init_from_parent()) {
  193. // All is well
  194. return true;
  195. }
  196. if (!allow_create) {
  197. return false;
  198. }
  199. // The ref in the column was NULL, create the tree in place.
  200. m_tree->create();
  201. REALM_ASSERT(m_tree->is_attached());
  202. return true;
  203. }
  204. /// Update the accessor and return true if it is attached after the update.
  205. inline bool update() const
  206. {
  207. return update_if_needed() != UpdateStatus::Detached;
  208. }
  209. // `do_` methods here perform the action after preconditions have been
  210. // checked (bounds check, writability, etc.).
  211. void do_insert(size_t ndx, T value);
  212. void do_erase(size_t ndx);
  213. void do_clear();
  214. iterator find_impl(const T& value) const;
  215. template <class It1, class It2>
  216. bool is_subset_of(It1, It2) const;
  217. template <class It1, class It2>
  218. bool is_superset_of(It1, It2) const;
  219. template <class It1, class It2>
  220. bool intersects(It1, It2) const;
  221. template <class It1, class It2>
  222. void assign_union(It1, It2);
  223. template <class It1, class It2>
  224. void assign_intersection(It1, It2);
  225. template <class It1, class It2>
  226. void assign_difference(It1, It2);
  227. template <class It1, class It2>
  228. void assign_symmetric_difference(It1, It2);
  229. static std::vector<T> convert_to_set(const CollectionBase& rhs, bool nullable);
  230. };
  231. class LnkSet final : public ObjCollectionBase<SetBase> {
  232. public:
  233. using Base = ObjCollectionBase<SetBase>;
  234. using value_type = ObjKey;
  235. using iterator = CollectionIterator<LnkSet>;
  236. LnkSet() = default;
  237. LnkSet(const Obj& owner, ColKey col_key)
  238. : m_set(owner, col_key)
  239. {
  240. }
  241. LnkSet(const LnkSet&) = default;
  242. LnkSet(LnkSet&&) = default;
  243. LnkSet& operator=(const LnkSet&) = default;
  244. LnkSet& operator=(LnkSet&&) = default;
  245. bool operator==(const LnkSet& other) const;
  246. bool operator!=(const LnkSet& other) const;
  247. ObjKey get(size_t ndx) const;
  248. size_t find(ObjKey) const;
  249. size_t find_first(ObjKey) const;
  250. std::pair<size_t, bool> insert(ObjKey);
  251. std::pair<size_t, bool> erase(ObjKey);
  252. bool is_subset_of(const CollectionBase&) const;
  253. bool is_strict_subset_of(const CollectionBase& rhs) const;
  254. bool is_superset_of(const CollectionBase& rhs) const;
  255. bool is_strict_superset_of(const CollectionBase& rhs) const;
  256. bool intersects(const CollectionBase& rhs) const;
  257. bool set_equals(const CollectionBase& rhs) const;
  258. void assign_union(const CollectionBase&);
  259. void assign_intersection(const CollectionBase&);
  260. void assign_difference(const CollectionBase&);
  261. void assign_symmetric_difference(const CollectionBase&);
  262. // Overriding members of CollectionBase:
  263. using CollectionBase::get_owner_key;
  264. CollectionBasePtr clone_collection() const
  265. {
  266. return clone_linkset();
  267. }
  268. size_t size() const final;
  269. bool is_null(size_t ndx) const final;
  270. Mixed get_any(size_t ndx) const final;
  271. void clear() final;
  272. util::Optional<Mixed> min(size_t* return_ndx = nullptr) const final;
  273. util::Optional<Mixed> max(size_t* return_ndx = nullptr) const final;
  274. util::Optional<Mixed> sum(size_t* return_cnt = nullptr) const final;
  275. util::Optional<Mixed> avg(size_t* return_cnt = nullptr) const final;
  276. void sort(std::vector<size_t>& indices, bool ascending = true) const final;
  277. void distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order = util::none) const final;
  278. const Obj& get_obj() const noexcept final;
  279. bool is_attached() const final;
  280. bool has_changed() const final;
  281. ColKey get_col_key() const noexcept final;
  282. // Overriding members of SetBase:
  283. SetBasePtr clone() const
  284. {
  285. return clone_linkset();
  286. }
  287. // Overriding members of ObjList:
  288. LinkCollectionPtr clone_obj_list() const final
  289. {
  290. return clone_linkset();
  291. }
  292. size_t find_any(Mixed) const final;
  293. std::pair<size_t, bool> insert_null() final;
  294. std::pair<size_t, bool> erase_null() final;
  295. std::pair<size_t, bool> insert_any(Mixed value) final;
  296. std::pair<size_t, bool> erase_any(Mixed value) final;
  297. // Overriding members of ObjList:
  298. Obj get_object(size_t ndx) const final;
  299. ObjKey get_key(size_t ndx) const final;
  300. // LnkSet interface:
  301. std::unique_ptr<LnkSet> clone_linkset() const
  302. {
  303. // FIXME: The copy constructor requires this.
  304. update_if_needed();
  305. return std::make_unique<LnkSet>(*this);
  306. }
  307. template <class Func>
  308. void find_all(ObjKey value, Func&& func) const
  309. {
  310. if (value.is_unresolved()) {
  311. return;
  312. }
  313. m_set.find_all(value, [&](size_t ndx) {
  314. func(real2virtual(ndx));
  315. });
  316. }
  317. TableView get_sorted_view(SortDescriptor order) const;
  318. TableView get_sorted_view(ColKey column_key, bool ascending = true);
  319. void remove_target_row(size_t link_ndx);
  320. void remove_all_target_rows();
  321. iterator begin() const noexcept
  322. {
  323. return iterator{this, 0};
  324. }
  325. iterator end() const noexcept
  326. {
  327. return iterator{this, size()};
  328. }
  329. private:
  330. Set<ObjKey> m_set;
  331. // Overriding members of ObjCollectionBase:
  332. UpdateStatus do_update_if_needed() const final
  333. {
  334. return m_set.update_if_needed();
  335. }
  336. BPlusTree<ObjKey>* get_mutable_tree() const final
  337. {
  338. return m_set.m_tree.get();
  339. }
  340. };
  341. template <>
  342. void Set<ObjKey>::do_insert(size_t, ObjKey);
  343. template <>
  344. void Set<ObjKey>::do_erase(size_t);
  345. template <>
  346. void Set<ObjKey>::do_clear();
  347. template <>
  348. void Set<ObjLink>::do_insert(size_t, ObjLink);
  349. template <>
  350. void Set<ObjLink>::do_erase(size_t);
  351. template <>
  352. void Set<Mixed>::do_insert(size_t, Mixed);
  353. template <>
  354. void Set<Mixed>::do_erase(size_t);
  355. template <>
  356. void Set<Mixed>::do_clear();
  357. template <>
  358. void Set<Mixed>::migrate();
  359. /// Compare set elements.
  360. ///
  361. /// We cannot use `std::less<>` directly, because the ordering of set elements
  362. /// impacts the file format. For primitive types this is trivial (and can indeed
  363. /// be just `std::less<>`), but for example `Mixed` has specialized comparison
  364. /// that defines equality of numeric types.
  365. template <class T>
  366. struct SetElementLessThan {
  367. bool operator()(const T& a, const T& b) const noexcept
  368. {
  369. // CAUTION: This routine is technically part of the file format, because
  370. // it determines the storage order of Set elements.
  371. return a < b;
  372. }
  373. };
  374. template <class T>
  375. struct SetElementEquals {
  376. bool operator()(const T& a, const T& b) const noexcept
  377. {
  378. // CAUTION: This routine is technically part of the file format, because
  379. // it determines the storage order of Set elements.
  380. return a == b;
  381. }
  382. };
  383. template <>
  384. struct SetElementLessThan<Mixed> {
  385. bool operator()(const Mixed& a, const Mixed& b) const noexcept
  386. {
  387. // CAUTION: This routine is technically part of the file format, because
  388. // it determines the storage order of Set elements.
  389. // These are the rules for comparison of Mixed types in a Set<Mixed>:
  390. // - If both values are null they are equal
  391. // - If only one value is null, that value is lesser than the other
  392. // - All numeric types are compared as the corresponding real numbers
  393. // would compare. So integer 3 equals double 3.
  394. // - String and binary types are compared using lexicographical comparison.
  395. // - All other types are compared using the comparison operators defined
  396. // for the types.
  397. // - If two values have different types, the rank of the types are compared.
  398. // the rank is as follows:
  399. // boolean
  400. // numeric
  401. // string
  402. // binary
  403. // Timestamp
  404. // ObjectId
  405. // UUID
  406. // TypedLink
  407. // Link
  408. //
  409. // The current Mixed::compare function implements these rules except when comparing
  410. // string and binary. If that function is changed we should either implement the rules
  411. // here or upgrade all Set<Mixed> columns.
  412. if (a.is_type(type_String) && b.is_type(type_Binary)) {
  413. return true;
  414. }
  415. if (a.is_type(type_Binary) && b.is_type(type_String)) {
  416. return false;
  417. }
  418. return a.compare(b) < 0;
  419. }
  420. };
  421. template <>
  422. struct SetElementEquals<Mixed> {
  423. bool operator()(const Mixed& a, const Mixed& b) const noexcept
  424. {
  425. // CAUTION: This routine is technically part of the file format, because
  426. // it determines the storage order of Set elements.
  427. // See comments above
  428. if (a.is_type(type_String) && b.is_type(type_Binary)) {
  429. return false;
  430. }
  431. if (a.is_type(type_Binary) && b.is_type(type_String)) {
  432. return false;
  433. }
  434. return a.compare(b) == 0;
  435. }
  436. };
  437. template <class T>
  438. inline Set<T>::Set(const Obj& obj, ColKey col_key)
  439. : Base(obj, col_key)
  440. {
  441. if (!col_key.is_set()) {
  442. throw InvalidArgument(ErrorCodes::TypeMismatch, "Property not a set");
  443. }
  444. check_column_type<value_type>(m_col_key);
  445. }
  446. template <class T>
  447. inline Set<T>::Set(const Set& other)
  448. : Base(static_cast<const Base&>(other))
  449. {
  450. // Reset the content version so we can rely on init_from_parent() being
  451. // called lazily when the accessor is used.
  452. Base::reset_content_version();
  453. }
  454. template <class T>
  455. inline Set<T>::Set(Set&& other) noexcept
  456. : Base(static_cast<Base&&>(other))
  457. , m_tree(std::exchange(other.m_tree, nullptr))
  458. {
  459. if (m_tree) {
  460. m_tree->set_parent(this, 0);
  461. }
  462. }
  463. template <class T>
  464. inline Set<T>& Set<T>::operator=(const Set& other)
  465. {
  466. Base::operator=(static_cast<const Base&>(other));
  467. if (this != &other) {
  468. // Just reset the pointer and rely on init_from_parent() being called
  469. // when the accessor is actually used.
  470. m_tree.reset();
  471. Base::reset_content_version();
  472. }
  473. return *this;
  474. }
  475. template <class T>
  476. inline Set<T>& Set<T>::operator=(Set&& other) noexcept
  477. {
  478. Base::operator=(static_cast<Base&&>(other));
  479. if (this != &other) {
  480. m_tree = std::exchange(other.m_tree, nullptr);
  481. if (m_tree) {
  482. m_tree->set_parent(this, 0);
  483. // Note: We do not need to call reset_content_version(), because we
  484. // took both `m_tree` and `m_content_version` from `other`.
  485. }
  486. }
  487. return *this;
  488. }
  489. template <typename U>
  490. Set<U> Obj::get_set(ColKey col_key) const
  491. {
  492. return Set<U>(*this, col_key);
  493. }
  494. template <typename U>
  495. inline SetPtr<U> Obj::get_set_ptr(ColKey col_key) const
  496. {
  497. return std::make_unique<Set<U>>(*this, col_key);
  498. }
  499. inline LnkSet Obj::get_linkset(ColKey col_key) const
  500. {
  501. return LnkSet{*this, col_key};
  502. }
  503. inline LnkSet Obj::get_linkset(StringData col_name) const
  504. {
  505. return get_linkset(get_column_key(col_name));
  506. }
  507. inline LnkSetPtr Obj::get_linkset_ptr(ColKey col_key) const
  508. {
  509. return std::make_unique<LnkSet>(*this, col_key);
  510. }
  511. template <class T>
  512. size_t Set<T>::find(T value) const
  513. {
  514. auto it = find_impl(value);
  515. if (it != end() && SetElementEquals<T>{}(*it, value)) {
  516. return it.index();
  517. }
  518. return npos;
  519. }
  520. template <class T>
  521. size_t Set<T>::find_any(Mixed value) const
  522. {
  523. if constexpr (std::is_same_v<T, Mixed>) {
  524. return find(value);
  525. }
  526. else {
  527. if (value.is_null()) {
  528. if (!m_nullable) {
  529. return not_found;
  530. }
  531. return find(BPlusTree<T>::default_value(true));
  532. }
  533. else {
  534. return find(value.get<typename util::RemoveOptional<T>::type>());
  535. }
  536. }
  537. }
  538. template <class T>
  539. REALM_NOINLINE auto Set<T>::find_impl(const T& value) const -> iterator
  540. {
  541. auto b = this->begin();
  542. auto e = this->end(); // Note: This ends up calling `update_if_needed()`.
  543. return std::lower_bound(b, e, value, SetElementLessThan<T>{});
  544. }
  545. template <class T>
  546. std::pair<size_t, bool> Set<T>::insert(T value)
  547. {
  548. update_if_needed();
  549. if (value_is_null(value) && !m_nullable)
  550. throw InvalidArgument(ErrorCodes::PropertyNotNullable,
  551. util::format("Set: %1", CollectionBase::get_property_name()));
  552. ensure_created();
  553. auto it = find_impl(value);
  554. if (it != this->end() && SetElementEquals<T>{}(*it, value)) {
  555. return {it.index(), false};
  556. }
  557. if (Replication* repl = m_obj.get_replication()) {
  558. // FIXME: We should emit an instruction regardless of element presence for the purposes of conflict
  559. // resolution in synchronized databases. The reason is that the new insertion may come at a later time
  560. // than an interleaving erase instruction, so emitting the instruction ensures that last "write" wins.
  561. this->insert_repl(repl, it.index(), value);
  562. }
  563. do_insert(it.index(), value);
  564. bump_content_version();
  565. return {it.index(), true};
  566. }
  567. template <class T>
  568. std::pair<size_t, bool> Set<T>::insert_any(Mixed value)
  569. {
  570. if constexpr (std::is_same_v<T, Mixed>) {
  571. return insert(value);
  572. }
  573. else {
  574. if (value.is_null()) {
  575. return insert_null();
  576. }
  577. else {
  578. return insert(value.get<typename util::RemoveOptional<T>::type>());
  579. }
  580. }
  581. }
  582. template <class T>
  583. std::pair<size_t, bool> Set<T>::erase(T value)
  584. {
  585. auto it = find_impl(value); // Note: This ends up calling `update_if_needed()`.
  586. if (it == end() || !SetElementEquals<T>{}(*it, value)) {
  587. return {npos, false};
  588. }
  589. if (Replication* repl = m_obj.get_replication()) {
  590. this->erase_repl(repl, it.index(), value);
  591. }
  592. do_erase(it.index());
  593. bump_content_version();
  594. return {it.index(), true};
  595. }
  596. template <class T>
  597. std::pair<size_t, bool> Set<T>::erase_any(Mixed value)
  598. {
  599. if constexpr (std::is_same_v<T, Mixed>) {
  600. return erase(value);
  601. }
  602. else {
  603. if (value.is_null()) {
  604. return erase_null();
  605. }
  606. else {
  607. return erase(value.get<typename util::RemoveOptional<T>::type>());
  608. }
  609. }
  610. }
  611. template <class T>
  612. inline std::pair<size_t, bool> Set<T>::insert_null()
  613. {
  614. return insert(BPlusTree<T>::default_value(this->m_nullable));
  615. }
  616. template <class T>
  617. std::pair<size_t, bool> Set<T>::erase_null()
  618. {
  619. return erase(BPlusTree<T>::default_value(this->m_nullable));
  620. }
  621. template <class T>
  622. REALM_NOINLINE size_t Set<T>::size() const
  623. {
  624. return update() ? m_tree->size() : 0;
  625. }
  626. template <class T>
  627. inline bool Set<T>::is_null(size_t ndx) const
  628. {
  629. return m_nullable && value_is_null(get(ndx));
  630. }
  631. template <class T>
  632. inline void Set<T>::clear()
  633. {
  634. if (size() > 0) {
  635. if (Replication* repl = this->m_obj.get_replication()) {
  636. this->clear_repl(repl);
  637. }
  638. do_clear();
  639. bump_content_version();
  640. }
  641. }
  642. template <class T>
  643. inline util::Optional<Mixed> Set<T>::min(size_t* return_ndx) const
  644. {
  645. if (update()) {
  646. return MinHelper<T>::eval(*m_tree, return_ndx);
  647. }
  648. return MinHelper<T>::not_found(return_ndx);
  649. }
  650. template <class T>
  651. inline util::Optional<Mixed> Set<T>::max(size_t* return_ndx) const
  652. {
  653. if (update()) {
  654. return MaxHelper<T>::eval(*m_tree, return_ndx);
  655. }
  656. return MaxHelper<T>::not_found(return_ndx);
  657. }
  658. template <class T>
  659. inline util::Optional<Mixed> Set<T>::sum(size_t* return_cnt) const
  660. {
  661. if (update()) {
  662. return SumHelper<T>::eval(*m_tree, return_cnt);
  663. }
  664. return SumHelper<T>::not_found(return_cnt);
  665. }
  666. template <class T>
  667. inline util::Optional<Mixed> Set<T>::avg(size_t* return_cnt) const
  668. {
  669. if (update()) {
  670. return AverageHelper<T>::eval(*m_tree, return_cnt);
  671. }
  672. return AverageHelper<T>::not_found(return_cnt);
  673. }
  674. void set_sorted_indices(size_t sz, std::vector<size_t>& indices, bool ascending);
  675. template <class T>
  676. inline void Set<T>::sort(std::vector<size_t>& indices, bool ascending) const
  677. {
  678. auto sz = size();
  679. set_sorted_indices(sz, indices, ascending);
  680. }
  681. template <>
  682. void Set<Mixed>::sort(std::vector<size_t>& indices, bool ascending) const;
  683. template <class T>
  684. inline void Set<T>::distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order) const
  685. {
  686. auto ascending = !sort_order || *sort_order;
  687. sort(indices, ascending);
  688. }
  689. template <class T>
  690. inline void Set<T>::do_insert(size_t ndx, T value)
  691. {
  692. m_tree->insert(ndx, value);
  693. }
  694. template <class T>
  695. inline void Set<T>::do_erase(size_t ndx)
  696. {
  697. m_tree->erase(ndx);
  698. }
  699. template <class T>
  700. inline void Set<T>::do_clear()
  701. {
  702. m_tree->clear();
  703. }
  704. template <class T>
  705. std::vector<T> Set<T>::convert_to_set(const CollectionBase& rhs, bool nullable)
  706. {
  707. if constexpr (std::is_same_v<T, Mixed>) {
  708. return SetBase::convert_to_mixed_set(rhs);
  709. }
  710. std::vector<Mixed> mixed = SetBase::convert_to_mixed_set(rhs);
  711. std::vector<T> ret;
  712. ret.reserve(mixed.size());
  713. for (auto&& val : mixed) {
  714. if constexpr (std::is_same_v<T, ObjKey>) {
  715. static_cast<void>(nullable);
  716. if (val.is_type(type_Link, type_TypedLink)) {
  717. ret.push_back(val.get<ObjKey>());
  718. }
  719. }
  720. else {
  721. if (val.is_type(ColumnTypeTraits<T>::id)) {
  722. ret.push_back(val.get<T>());
  723. }
  724. else if (val.is_null() && nullable) {
  725. ret.push_back(BPlusTree<T>::default_value(true));
  726. }
  727. }
  728. }
  729. return ret;
  730. }
  731. template <class T>
  732. bool Set<T>::is_subset_of(const CollectionBase& rhs) const
  733. {
  734. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  735. return is_subset_of(other_set->begin(), other_set->end());
  736. }
  737. auto other_set = convert_to_set(rhs, m_nullable);
  738. return is_subset_of(other_set.begin(), other_set.end());
  739. }
  740. template <class T>
  741. template <class It1, class It2>
  742. bool Set<T>::is_subset_of(It1 first, It2 last) const
  743. {
  744. return std::includes(first, last, begin(), end(), SetElementLessThan<T>{});
  745. }
  746. template <class T>
  747. bool Set<T>::is_strict_subset_of(const CollectionBase& rhs) const
  748. {
  749. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  750. return size() != rhs.size() && is_subset_of(other_set->begin(), other_set->end());
  751. }
  752. auto other_set = convert_to_set(rhs, m_nullable);
  753. return size() != other_set.size() && is_subset_of(other_set.begin(), other_set.end());
  754. }
  755. template <class T>
  756. bool Set<T>::is_superset_of(const CollectionBase& rhs) const
  757. {
  758. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  759. return is_superset_of(other_set->begin(), other_set->end());
  760. }
  761. auto other_set = convert_to_set(rhs, m_nullable);
  762. return is_superset_of(other_set.begin(), other_set.end());
  763. }
  764. template <class T>
  765. template <class It1, class It2>
  766. bool Set<T>::is_superset_of(It1 first, It2 last) const
  767. {
  768. return std::includes(begin(), end(), first, last, SetElementLessThan<T>{});
  769. }
  770. template <class T>
  771. bool Set<T>::is_strict_superset_of(const CollectionBase& rhs) const
  772. {
  773. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  774. return size() != rhs.size() && is_superset_of(other_set->begin(), other_set->end());
  775. }
  776. auto other_set = convert_to_set(rhs, m_nullable);
  777. return size() != other_set.size() && is_superset_of(other_set.begin(), other_set.end());
  778. }
  779. template <class T>
  780. bool Set<T>::intersects(const CollectionBase& rhs) const
  781. {
  782. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  783. return intersects(other_set->begin(), other_set->end());
  784. }
  785. auto other_set = convert_to_set(rhs, m_nullable);
  786. return intersects(other_set.begin(), other_set.end());
  787. }
  788. template <class T>
  789. template <class It1, class It2>
  790. bool Set<T>::intersects(It1 first, It2 last) const
  791. {
  792. SetElementLessThan<T> less;
  793. auto it = begin();
  794. while (it != end() && first != last) {
  795. if (less(*it, *first)) {
  796. ++it;
  797. }
  798. else if (less(*first, *it)) {
  799. ++first;
  800. }
  801. else {
  802. return true;
  803. }
  804. }
  805. return false;
  806. }
  807. template <class T>
  808. bool Set<T>::set_equals(const CollectionBase& rhs) const
  809. {
  810. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  811. return size() == rhs.size() && is_subset_of(other_set->begin(), other_set->end());
  812. }
  813. auto other_set = convert_to_set(rhs, m_nullable);
  814. return size() == other_set.size() && is_subset_of(other_set.begin(), other_set.end());
  815. }
  816. template <class T>
  817. inline void Set<T>::assign_union(const CollectionBase& rhs)
  818. {
  819. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  820. return assign_union(other_set->begin(), other_set->end());
  821. }
  822. auto other_set = convert_to_set(rhs, m_nullable);
  823. return assign_union(other_set.begin(), other_set.end());
  824. }
  825. template <class T>
  826. template <class It1, class It2>
  827. void Set<T>::assign_union(It1 first, It2 last)
  828. {
  829. std::vector<T> the_diff;
  830. std::set_difference(first, last, begin(), end(), std::back_inserter(the_diff), SetElementLessThan<T>{});
  831. // 'the_diff' now contains all the elements that are in foreign set, but not in 'this'
  832. // Now insert those elements
  833. for (auto&& value : the_diff) {
  834. insert(value);
  835. }
  836. }
  837. template <class T>
  838. inline void Set<T>::assign_intersection(const CollectionBase& rhs)
  839. {
  840. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  841. return assign_intersection(other_set->begin(), other_set->end());
  842. }
  843. auto other_set = convert_to_set(rhs, m_nullable);
  844. return assign_intersection(other_set.begin(), other_set.end());
  845. }
  846. template <class T>
  847. template <class It1, class It2>
  848. void Set<T>::assign_intersection(It1 first, It2 last)
  849. {
  850. std::vector<T> intersection;
  851. std::set_intersection(first, last, begin(), end(), std::back_inserter(intersection), SetElementLessThan<T>{});
  852. clear();
  853. // Elements in intersection comes from foreign set, so ok to use here
  854. for (auto&& value : intersection) {
  855. insert(value);
  856. }
  857. }
  858. template <class T>
  859. inline void Set<T>::assign_difference(const CollectionBase& rhs)
  860. {
  861. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  862. return assign_difference(other_set->begin(), other_set->end());
  863. }
  864. auto other_set = convert_to_set(rhs, m_nullable);
  865. return assign_difference(other_set.begin(), other_set.end());
  866. }
  867. template <class T>
  868. template <class It1, class It2>
  869. void Set<T>::assign_difference(It1 first, It2 last)
  870. {
  871. std::vector<T> intersection;
  872. std::set_intersection(first, last, begin(), end(), std::back_inserter(intersection), SetElementLessThan<T>{});
  873. // 'intersection' now contains all the elements that are in both foreign set and 'this'.
  874. // Remove those elements. The elements comes from the foreign set, so ok to refer to.
  875. for (auto&& value : intersection) {
  876. erase(value);
  877. }
  878. }
  879. template <class T>
  880. inline void Set<T>::assign_symmetric_difference(const CollectionBase& rhs)
  881. {
  882. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  883. return assign_symmetric_difference(other_set->begin(), other_set->end());
  884. }
  885. auto other_set = convert_to_set(rhs, m_nullable);
  886. return assign_symmetric_difference(other_set.begin(), other_set.end());
  887. }
  888. template <class T>
  889. template <class It1, class It2>
  890. void Set<T>::assign_symmetric_difference(It1 first, It2 last)
  891. {
  892. std::vector<T> difference;
  893. std::set_difference(first, last, begin(), end(), std::back_inserter(difference), SetElementLessThan<T>{});
  894. std::vector<T> intersection;
  895. std::set_intersection(first, last, begin(), end(), std::back_inserter(intersection), SetElementLessThan<T>{});
  896. // Now remove the common elements and add the differences
  897. for (auto&& value : intersection) {
  898. erase(value);
  899. }
  900. for (auto&& value : difference) {
  901. insert(value);
  902. }
  903. }
  904. inline bool LnkSet::operator==(const LnkSet& other) const
  905. {
  906. return m_set == other.m_set;
  907. }
  908. inline bool LnkSet::operator!=(const LnkSet& other) const
  909. {
  910. return m_set != other.m_set;
  911. }
  912. inline ObjKey LnkSet::get(size_t ndx) const
  913. {
  914. const auto current_size = size();
  915. if (ndx >= current_size) {
  916. throw OutOfBounds(util::format("Invalid index into set: %1", CollectionBase::get_property_name()), ndx,
  917. current_size);
  918. }
  919. return m_set.m_tree->get(virtual2real(ndx));
  920. }
  921. inline size_t LnkSet::find(ObjKey value) const
  922. {
  923. if (value.is_unresolved()) {
  924. return not_found;
  925. }
  926. update_if_needed();
  927. size_t ndx = m_set.find(value);
  928. if (ndx == not_found) {
  929. return not_found;
  930. }
  931. return real2virtual(ndx);
  932. }
  933. inline size_t LnkSet::find_first(ObjKey value) const
  934. {
  935. return find(value);
  936. }
  937. inline size_t LnkSet::size() const
  938. {
  939. update_if_needed();
  940. return m_set.size() - num_unresolved();
  941. }
  942. inline std::pair<size_t, bool> LnkSet::insert(ObjKey value)
  943. {
  944. REALM_ASSERT(!value.is_unresolved());
  945. update_if_needed();
  946. auto [ndx, inserted] = m_set.insert(value);
  947. if (inserted) {
  948. update_unresolved(UpdateStatus::Updated);
  949. }
  950. return {real2virtual(ndx), inserted};
  951. }
  952. inline std::pair<size_t, bool> LnkSet::erase(ObjKey value)
  953. {
  954. REALM_ASSERT(!value.is_unresolved());
  955. update_if_needed();
  956. auto [ndx, removed] = m_set.erase(value);
  957. if (removed) {
  958. update_unresolved(UpdateStatus::Updated);
  959. ndx = real2virtual(ndx);
  960. }
  961. return {ndx, removed};
  962. }
  963. inline bool LnkSet::is_null(size_t ndx) const
  964. {
  965. update_if_needed();
  966. return m_set.is_null(virtual2real(ndx));
  967. }
  968. inline Mixed LnkSet::get_any(size_t ndx) const
  969. {
  970. update_if_needed();
  971. auto obj_key = m_set.get(virtual2real(ndx));
  972. return ObjLink{get_target_table()->get_key(), obj_key};
  973. }
  974. inline std::pair<size_t, bool> LnkSet::insert_null()
  975. {
  976. update_if_needed();
  977. auto [ndx, inserted] = m_set.insert_null();
  978. if (inserted) {
  979. update_unresolved(UpdateStatus::Updated);
  980. }
  981. return {real2virtual(ndx), inserted};
  982. }
  983. inline std::pair<size_t, bool> LnkSet::erase_null()
  984. {
  985. update_if_needed();
  986. auto [ndx, erased] = m_set.erase_null();
  987. if (erased) {
  988. update_unresolved(UpdateStatus::Updated);
  989. ndx = real2virtual(ndx);
  990. }
  991. return {ndx, erased};
  992. }
  993. inline std::pair<size_t, bool> LnkSet::insert_any(Mixed value)
  994. {
  995. update_if_needed();
  996. auto [ndx, inserted] = m_set.insert_any(value);
  997. if (inserted) {
  998. update_unresolved(UpdateStatus::Updated);
  999. }
  1000. return {real2virtual(ndx), inserted};
  1001. }
  1002. inline std::pair<size_t, bool> LnkSet::erase_any(Mixed value)
  1003. {
  1004. auto [ndx, erased] = m_set.erase_any(value);
  1005. if (erased) {
  1006. update_unresolved(UpdateStatus::Updated);
  1007. ndx = real2virtual(ndx);
  1008. }
  1009. return {ndx, erased};
  1010. }
  1011. inline void LnkSet::clear()
  1012. {
  1013. // Note: Explicit call to `ensure_writable()` not needed, because we
  1014. // explicitly call `clear_unresolved()`.
  1015. m_set.clear();
  1016. clear_unresolved();
  1017. }
  1018. inline util::Optional<Mixed> LnkSet::min(size_t* return_ndx) const
  1019. {
  1020. update_if_needed();
  1021. size_t found = not_found;
  1022. auto value = m_set.min(&found);
  1023. if (found != not_found && return_ndx) {
  1024. *return_ndx = real2virtual(found);
  1025. }
  1026. return value;
  1027. }
  1028. inline util::Optional<Mixed> LnkSet::max(size_t* return_ndx) const
  1029. {
  1030. update_if_needed();
  1031. size_t found = not_found;
  1032. auto value = m_set.max(&found);
  1033. if (found != not_found && return_ndx) {
  1034. *return_ndx = real2virtual(found);
  1035. }
  1036. return value;
  1037. }
  1038. inline util::Optional<Mixed> LnkSet::sum(size_t* return_cnt) const
  1039. {
  1040. static_cast<void>(return_cnt);
  1041. REALM_TERMINATE("Not implemented");
  1042. }
  1043. inline util::Optional<Mixed> LnkSet::avg(size_t* return_cnt) const
  1044. {
  1045. static_cast<void>(return_cnt);
  1046. REALM_TERMINATE("Not implemented");
  1047. }
  1048. inline void LnkSet::sort(std::vector<size_t>& indices, bool ascending) const
  1049. {
  1050. update_if_needed();
  1051. // Map the input indices to real indices.
  1052. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  1053. return virtual2real(ndx);
  1054. });
  1055. m_set.sort(indices, ascending);
  1056. // Map the output indices to virtual indices.
  1057. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  1058. return real2virtual(ndx);
  1059. });
  1060. }
  1061. inline void LnkSet::distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order) const
  1062. {
  1063. update_if_needed();
  1064. // Map the input indices to real indices.
  1065. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  1066. return virtual2real(ndx);
  1067. });
  1068. m_set.distinct(indices, sort_order);
  1069. // Map the output indices to virtual indices.
  1070. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  1071. return real2virtual(ndx);
  1072. });
  1073. }
  1074. inline const Obj& LnkSet::get_obj() const noexcept
  1075. {
  1076. return m_set.get_obj();
  1077. }
  1078. inline bool LnkSet::is_attached() const
  1079. {
  1080. return m_set.is_attached();
  1081. }
  1082. inline bool LnkSet::has_changed() const
  1083. {
  1084. return m_set.has_changed();
  1085. }
  1086. inline ColKey LnkSet::get_col_key() const noexcept
  1087. {
  1088. return m_set.get_col_key();
  1089. }
  1090. inline size_t LnkSet::find_any(Mixed value) const
  1091. {
  1092. if (value.is_null())
  1093. return not_found;
  1094. const auto type = value.get_type();
  1095. if (type == type_Link) {
  1096. return find(value.get<ObjKey>());
  1097. }
  1098. if (type == type_TypedLink) {
  1099. auto link = value.get_link();
  1100. if (link.get_table_key() == get_target_table()->get_key()) {
  1101. return find(link.get_obj_key());
  1102. }
  1103. }
  1104. return not_found;
  1105. }
  1106. inline Obj LnkSet::get_object(size_t ndx) const
  1107. {
  1108. ObjKey key = get(ndx);
  1109. return get_target_table()->get_object(key);
  1110. }
  1111. inline ObjKey LnkSet::get_key(size_t ndx) const
  1112. {
  1113. return get(ndx);
  1114. }
  1115. inline void LnkSet::assign_union(const CollectionBase& rhs)
  1116. {
  1117. m_set.assign_union(rhs);
  1118. update_unresolved(UpdateStatus::Updated);
  1119. }
  1120. inline void LnkSet::assign_intersection(const CollectionBase& rhs)
  1121. {
  1122. m_set.assign_intersection(rhs);
  1123. update_unresolved(UpdateStatus::Updated);
  1124. }
  1125. inline void LnkSet::assign_difference(const CollectionBase& rhs)
  1126. {
  1127. m_set.assign_difference(rhs);
  1128. update_unresolved(UpdateStatus::Updated);
  1129. }
  1130. inline void LnkSet::assign_symmetric_difference(const CollectionBase& rhs)
  1131. {
  1132. m_set.assign_symmetric_difference(rhs);
  1133. update_unresolved(UpdateStatus::Updated);
  1134. }
  1135. } // namespace realm
  1136. #endif // REALM_SET_HPP