set.hpp 33 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229
  1. /*************************************************************************
  2. *
  3. * Copyright 2020 Realm Inc.
  4. *
  5. * Licensed under the Apache License, Version 2.0 (the "License");
  6. * you may not use this file except in compliance with the License.
  7. * You may obtain a copy of the License at
  8. *
  9. * http://www.apache.org/licenses/LICENSE-2.0
  10. *
  11. * Unless required by applicable law or agreed to in writing, software
  12. * distributed under the License is distributed on an "AS IS" BASIS,
  13. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. * See the License for the specific language governing permissions and
  15. * limitations under the License.
  16. *
  17. **************************************************************************/
  18. #ifndef REALM_SET_HPP
  19. #define REALM_SET_HPP
  20. #include <realm/collection.hpp>
  21. #include <realm/bplustree.hpp>
  22. #include <realm/array_key.hpp>
  23. #include <numeric> // std::iota
  24. #include <set>
  25. namespace realm {
  26. class SetBase : public CollectionBase {
  27. public:
  28. using CollectionBase::CollectionBase;
  29. virtual ~SetBase() {}
  30. virtual SetBasePtr clone() const = 0;
  31. virtual std::pair<size_t, bool> insert_null() = 0;
  32. virtual std::pair<size_t, bool> erase_null() = 0;
  33. virtual std::pair<size_t, bool> insert_any(Mixed value) = 0;
  34. virtual std::pair<size_t, bool> erase_any(Mixed value) = 0;
  35. protected:
  36. void insert_repl(Replication* repl, size_t index, Mixed value) const;
  37. void erase_repl(Replication* repl, size_t index, Mixed value) const;
  38. void clear_repl(Replication* repl) const;
  39. };
  40. template <class T>
  41. class Set final : public CollectionBaseImpl<SetBase> {
  42. public:
  43. using Base = CollectionBaseImpl<SetBase>;
  44. using value_type = T;
  45. using iterator = CollectionIterator<Set<T>>;
  46. Set() = default;
  47. Set(const Obj& owner, ColKey col_key);
  48. Set(const Set& other);
  49. Set(Set&& other) noexcept;
  50. Set& operator=(const Set& other);
  51. Set& operator=(Set&& other) noexcept;
  52. using Base::operator==;
  53. using Base::operator!=;
  54. SetBasePtr clone() const final
  55. {
  56. return std::make_unique<Set<T>>(*this);
  57. }
  58. T get(size_t ndx) const
  59. {
  60. const auto current_size = size();
  61. if (ndx >= current_size) {
  62. throw std::out_of_range("Index out of range");
  63. }
  64. return m_tree->get(ndx);
  65. }
  66. iterator begin() const noexcept
  67. {
  68. return iterator{this, 0};
  69. }
  70. iterator end() const noexcept
  71. {
  72. return iterator{this, size()};
  73. }
  74. size_t find_first(const T& value) const
  75. {
  76. return find(value);
  77. }
  78. template <class Func>
  79. void find_all(T value, Func&& func) const
  80. {
  81. size_t found = find(value);
  82. if (found != not_found) {
  83. func(found);
  84. }
  85. }
  86. bool is_subset_of(const CollectionBase&) const;
  87. bool is_strict_subset_of(const CollectionBase& rhs) const;
  88. bool is_superset_of(const CollectionBase& rhs) const;
  89. bool is_strict_superset_of(const CollectionBase& rhs) const;
  90. bool intersects(const CollectionBase& rhs) const;
  91. bool set_equals(const CollectionBase& rhs) const;
  92. void assign_union(const CollectionBase&);
  93. void assign_intersection(const CollectionBase&);
  94. void assign_difference(const CollectionBase&);
  95. void assign_symmetric_difference(const CollectionBase&);
  96. /// Insert a value into the set if it does not already exist, returning the index of the inserted value,
  97. /// or the index of the already-existing value.
  98. std::pair<size_t, bool> insert(T value);
  99. /// Find the index of a value in the set, or `size_t(-1)` if it is not in the set.
  100. size_t find(T value) const;
  101. /// Erase an element from the set, returning true if the set contained the element.
  102. std::pair<size_t, bool> erase(T value);
  103. // Overriding members of CollectionBase:
  104. size_t size() const final;
  105. bool is_null(size_t ndx) const final;
  106. Mixed get_any(size_t ndx) const final
  107. {
  108. return get(ndx);
  109. }
  110. void clear() final;
  111. util::Optional<Mixed> min(size_t* return_ndx = nullptr) const final;
  112. util::Optional<Mixed> max(size_t* return_ndx = nullptr) const final;
  113. util::Optional<Mixed> sum(size_t* return_cnt = nullptr) const final;
  114. util::Optional<Mixed> avg(size_t* return_cnt = nullptr) const final;
  115. std::unique_ptr<CollectionBase> clone_collection() const final
  116. {
  117. return std::make_unique<Set<T>>(*this);
  118. }
  119. void sort(std::vector<size_t>& indices, bool ascending = true) const final;
  120. void distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order = util::none) const final;
  121. // Overriding members of SetBase:
  122. size_t find_any(Mixed) const final;
  123. std::pair<size_t, bool> insert_null() final;
  124. std::pair<size_t, bool> erase_null() final;
  125. std::pair<size_t, bool> insert_any(Mixed value) final;
  126. std::pair<size_t, bool> erase_any(Mixed value) final;
  127. const BPlusTree<T>& get_tree() const
  128. {
  129. return *m_tree;
  130. }
  131. private:
  132. friend class LnkSet;
  133. mutable std::unique_ptr<BPlusTree<T>> m_tree;
  134. using Base::m_col_key;
  135. using Base::m_obj;
  136. using Base::m_valid;
  137. void create()
  138. {
  139. m_tree->create();
  140. m_valid = true;
  141. }
  142. REALM_NOINLINE bool init_from_parent() const final
  143. {
  144. m_valid = m_tree->init_from_parent();
  145. update_content_version();
  146. return m_valid;
  147. }
  148. REALM_NOINLINE void ensure_created()
  149. {
  150. if (!m_valid && m_obj.is_valid()) {
  151. create();
  152. }
  153. }
  154. void do_insert(size_t ndx, T value);
  155. void do_erase(size_t ndx);
  156. void do_clear();
  157. iterator find_impl(const T& value) const;
  158. template <class It1, class It2>
  159. bool is_subset_of(It1, It2) const;
  160. template <class It1, class It2>
  161. bool is_superset_of(It1, It2) const;
  162. template <class It1, class It2>
  163. bool intersects(It1, It2) const;
  164. template <class It1, class It2>
  165. void assign_union(It1, It2);
  166. template <class It1, class It2>
  167. void assign_intersection(It1, It2);
  168. template <class It1, class It2>
  169. void assign_difference(It1, It2);
  170. template <class It1, class It2>
  171. void assign_symmetric_difference(It1, It2);
  172. };
  173. class LnkSet final : public ObjCollectionBase<SetBase> {
  174. public:
  175. using Base = ObjCollectionBase<SetBase>;
  176. using value_type = ObjKey;
  177. using iterator = CollectionIterator<LnkSet>;
  178. LnkSet() = default;
  179. LnkSet(const Obj& owner, ColKey col_key)
  180. : m_set(owner, col_key)
  181. {
  182. update_unresolved();
  183. }
  184. LnkSet(const LnkSet&) = default;
  185. LnkSet(LnkSet&&) = default;
  186. LnkSet& operator=(const LnkSet&) = default;
  187. LnkSet& operator=(LnkSet&&) = default;
  188. bool operator==(const LnkSet& other) const;
  189. bool operator!=(const LnkSet& other) const;
  190. ObjKey get(size_t ndx) const;
  191. size_t find(ObjKey) const;
  192. size_t find_first(ObjKey) const;
  193. std::pair<size_t, bool> insert(ObjKey);
  194. std::pair<size_t, bool> erase(ObjKey);
  195. bool is_subset_of(const CollectionBase&) const;
  196. bool is_strict_subset_of(const CollectionBase& rhs) const;
  197. bool is_superset_of(const CollectionBase& rhs) const;
  198. bool is_strict_superset_of(const CollectionBase& rhs) const;
  199. bool intersects(const CollectionBase& rhs) const;
  200. bool set_equals(const CollectionBase& rhs) const;
  201. void assign_union(const CollectionBase&);
  202. void assign_intersection(const CollectionBase&);
  203. void assign_difference(const CollectionBase&);
  204. void assign_symmetric_difference(const CollectionBase&);
  205. // Overriding members of CollectionBase:
  206. using CollectionBase::get_owner_key;
  207. CollectionBasePtr clone_collection() const
  208. {
  209. return clone_linkset();
  210. }
  211. size_t size() const final;
  212. bool is_null(size_t ndx) const final;
  213. Mixed get_any(size_t ndx) const final;
  214. void clear() final;
  215. util::Optional<Mixed> min(size_t* return_ndx = nullptr) const final;
  216. util::Optional<Mixed> max(size_t* return_ndx = nullptr) const final;
  217. util::Optional<Mixed> sum(size_t* return_cnt = nullptr) const final;
  218. util::Optional<Mixed> avg(size_t* return_cnt = nullptr) const final;
  219. void sort(std::vector<size_t>& indices, bool ascending = true) const final;
  220. void distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order = util::none) const final;
  221. const Obj& get_obj() const noexcept final;
  222. bool is_attached() const final;
  223. bool has_changed() const final;
  224. ColKey get_col_key() const noexcept final;
  225. // Overriding members of SetBase:
  226. SetBasePtr clone() const
  227. {
  228. return clone_linkset();
  229. }
  230. // Overriding members of ObjList:
  231. LinkCollectionPtr clone_obj_list() const final
  232. {
  233. return clone_linkset();
  234. }
  235. size_t find_any(Mixed) const final;
  236. std::pair<size_t, bool> insert_null() final;
  237. std::pair<size_t, bool> erase_null() final;
  238. std::pair<size_t, bool> insert_any(Mixed value) final;
  239. std::pair<size_t, bool> erase_any(Mixed value) final;
  240. // Overriding members of ObjList:
  241. bool is_obj_valid(size_t) const noexcept final;
  242. Obj get_object(size_t ndx) const final;
  243. ObjKey get_key(size_t ndx) const final;
  244. // LnkSet interface:
  245. std::unique_ptr<LnkSet> clone_linkset() const
  246. {
  247. // FIXME: The copy constructor requires this.
  248. update_if_needed();
  249. return std::make_unique<LnkSet>(*this);
  250. }
  251. template <class Func>
  252. void find_all(ObjKey value, Func&& func) const
  253. {
  254. if (value.is_unresolved()) {
  255. return;
  256. }
  257. m_set.find_all(value, [&](size_t ndx) {
  258. func(real2virtual(ndx));
  259. });
  260. }
  261. TableView get_sorted_view(SortDescriptor order) const;
  262. TableView get_sorted_view(ColKey column_key, bool ascending = true);
  263. void remove_target_row(size_t link_ndx);
  264. void remove_all_target_rows();
  265. iterator begin() const noexcept
  266. {
  267. return iterator{this, 0};
  268. }
  269. iterator end() const noexcept
  270. {
  271. return iterator{this, size()};
  272. }
  273. private:
  274. Set<ObjKey> m_set;
  275. bool do_update_if_needed() const final
  276. {
  277. return m_set.update_if_needed();
  278. }
  279. bool do_init_from_parent() const final
  280. {
  281. return m_set.init_from_parent();
  282. }
  283. BPlusTree<ObjKey>* get_mutable_tree() const final
  284. {
  285. return m_set.m_tree.get();
  286. }
  287. };
  288. template <>
  289. void Set<ObjKey>::do_insert(size_t, ObjKey);
  290. template <>
  291. void Set<ObjKey>::do_erase(size_t);
  292. template <>
  293. void Set<ObjKey>::do_clear();
  294. template <>
  295. void Set<ObjLink>::do_insert(size_t, ObjLink);
  296. template <>
  297. void Set<ObjLink>::do_erase(size_t);
  298. template <>
  299. void Set<Mixed>::do_insert(size_t, Mixed);
  300. template <>
  301. void Set<Mixed>::do_erase(size_t);
  302. template <>
  303. void Set<Mixed>::do_clear();
  304. /// Compare set elements.
  305. ///
  306. /// We cannot use `std::less<>` directly, because the ordering of set elements
  307. /// impacts the file format. For primitive types this is trivial (and can indeed
  308. /// be just `std::less<>`), but for example `Mixed` has specialized comparison
  309. /// that defines equality of numeric types.
  310. template <class T>
  311. struct SetElementLessThan {
  312. bool operator()(const T& a, const T& b) const noexcept
  313. {
  314. // CAUTION: This routine is technically part of the file format, because
  315. // it determines the storage order of Set elements.
  316. return a < b;
  317. }
  318. };
  319. template <class T>
  320. struct SetElementEquals {
  321. bool operator()(const T& a, const T& b) const noexcept
  322. {
  323. // CAUTION: This routine is technically part of the file format, because
  324. // it determines the storage order of Set elements.
  325. return a == b;
  326. }
  327. };
  328. template <>
  329. struct SetElementLessThan<Mixed> {
  330. bool operator()(const Mixed& a, const Mixed& b) const noexcept
  331. {
  332. // CAUTION: This routine is technically part of the file format, because
  333. // it determines the storage order of Set elements.
  334. // These are the rules for comparison of Mixed types in a Set<Mixed>:
  335. // - If both values are null they are equal
  336. // - If only one value is null, that value is lesser than the other
  337. // - All numeric types are compared as the corresponding real numbers
  338. // would compare. So integer 3 equals double 3.
  339. // - String and binary types are compared using lexicographical comparison.
  340. // - All other types are compared using the comparison operators defined
  341. // for the types.
  342. // - If two values have different types, the rank of the types are compared.
  343. // the rank is as follows:
  344. // boolean
  345. // numeric
  346. // string/binary
  347. // Timestamp
  348. // ObjectId
  349. // UUID
  350. // TypedLink
  351. // Link
  352. //
  353. // The current Mixed::compare_utf8 function implements these rules. If that
  354. // function is changed we should either implement the rules here or
  355. // upgrade all Set<Mixed> columns.
  356. return a.compare(b) < 0;
  357. }
  358. };
  359. template <>
  360. struct SetElementEquals<Mixed> {
  361. bool operator()(const Mixed& a, const Mixed& b) const noexcept
  362. {
  363. // CAUTION: This routine is technically part of the file format, because
  364. // it determines the storage order of Set elements.
  365. // See comments above
  366. return a.compare(b) == 0;
  367. }
  368. };
  369. template <class T>
  370. inline Set<T>::Set(const Obj& obj, ColKey col_key)
  371. : Base(obj, col_key)
  372. , m_tree(new BPlusTree<value_type>(obj.get_alloc()))
  373. {
  374. if (!col_key.is_set()) {
  375. throw LogicError(LogicError::collection_type_mismatch);
  376. }
  377. check_column_type<value_type>(m_col_key);
  378. m_tree->set_parent(this, 0); // ndx not used, implicit in m_owner
  379. if (m_obj) {
  380. // Fine because init_from_parent() is final.
  381. this->init_from_parent();
  382. }
  383. }
  384. template <class T>
  385. inline Set<T>::Set(const Set& other)
  386. : Base(static_cast<const Base&>(other))
  387. {
  388. // FIXME: If the other side needed an update, we could be using a stale ref
  389. // below.
  390. REALM_ASSERT(!other.update_if_needed());
  391. if (other.m_tree) {
  392. Allocator& alloc = other.m_tree->get_alloc();
  393. m_tree = std::make_unique<BPlusTree<T>>(alloc);
  394. m_tree->set_parent(this, 0);
  395. if (m_valid)
  396. m_tree->init_from_ref(other.m_tree->get_ref());
  397. }
  398. }
  399. template <class T>
  400. inline Set<T>::Set(Set&& other) noexcept
  401. : Base(static_cast<Base&&>(other))
  402. , m_tree(std::exchange(other.m_tree, nullptr))
  403. {
  404. if (m_tree) {
  405. m_tree->set_parent(this, 0);
  406. }
  407. }
  408. template <class T>
  409. inline Set<T>& Set<T>::operator=(const Set& other)
  410. {
  411. Base::operator=(static_cast<const Base&>(other));
  412. if (this != &other) {
  413. m_tree.reset();
  414. if (other.m_tree) {
  415. Allocator& alloc = other.m_tree->get_alloc();
  416. m_tree = std::make_unique<BPlusTree<T>>(alloc);
  417. m_tree->set_parent(this, 0);
  418. if (m_valid) {
  419. m_tree->init_from_ref(other.m_tree->get_ref());
  420. }
  421. }
  422. }
  423. return *this;
  424. }
  425. template <class T>
  426. inline Set<T>& Set<T>::operator=(Set&& other) noexcept
  427. {
  428. Base::operator=(static_cast<Base&&>(other));
  429. if (this != &other) {
  430. m_tree = std::exchange(other.m_tree, nullptr);
  431. if (m_tree) {
  432. m_tree->set_parent(this, 0);
  433. }
  434. }
  435. return *this;
  436. }
  437. template <typename U>
  438. Set<U> Obj::get_set(ColKey col_key) const
  439. {
  440. return Set<U>(*this, col_key);
  441. }
  442. template <typename U>
  443. inline SetPtr<U> Obj::get_set_ptr(ColKey col_key) const
  444. {
  445. return std::make_unique<Set<U>>(*this, col_key);
  446. }
  447. inline LnkSet Obj::get_linkset(ColKey col_key) const
  448. {
  449. return LnkSet{*this, col_key};
  450. }
  451. inline LnkSetPtr Obj::get_linkset_ptr(ColKey col_key) const
  452. {
  453. return std::make_unique<LnkSet>(*this, col_key);
  454. }
  455. template <class T>
  456. size_t Set<T>::find(T value) const
  457. {
  458. auto it = find_impl(value);
  459. if (it != end() && SetElementEquals<T>{}(*it, value)) {
  460. return it.index();
  461. }
  462. return npos;
  463. }
  464. template <class T>
  465. size_t Set<T>::find_any(Mixed value) const
  466. {
  467. if constexpr (std::is_same_v<T, Mixed>) {
  468. return find(value);
  469. }
  470. else {
  471. if (value.is_null()) {
  472. if (!m_nullable) {
  473. return not_found;
  474. }
  475. return find(BPlusTree<T>::default_value(true));
  476. }
  477. else {
  478. return find(value.get<typename util::RemoveOptional<T>::type>());
  479. }
  480. }
  481. }
  482. template <class T>
  483. REALM_NOINLINE auto Set<T>::find_impl(const T& value) const -> iterator
  484. {
  485. auto b = this->begin();
  486. auto e = this->end();
  487. return std::lower_bound(b, e, value, SetElementLessThan<T>{});
  488. }
  489. template <class T>
  490. std::pair<size_t, bool> Set<T>::insert(T value)
  491. {
  492. update_if_needed();
  493. if (value_is_null(value) && !m_nullable)
  494. throw LogicError(LogicError::column_not_nullable);
  495. ensure_created();
  496. this->ensure_writeable();
  497. auto it = find_impl(value);
  498. if (it != this->end() && SetElementEquals<T>{}(*it, value)) {
  499. return {it.index(), false};
  500. }
  501. if (Replication* repl = m_obj.get_replication()) {
  502. // FIXME: We should emit an instruction regardless of element presence for the purposes of conflict
  503. // resolution in synchronized databases. The reason is that the new insertion may come at a later time
  504. // than an interleaving erase instruction, so emitting the instruction ensures that last "write" wins.
  505. this->insert_repl(repl, it.index(), value);
  506. }
  507. do_insert(it.index(), value);
  508. bump_content_version();
  509. return {it.index(), true};
  510. }
  511. template <class T>
  512. std::pair<size_t, bool> Set<T>::insert_any(Mixed value)
  513. {
  514. if constexpr (std::is_same_v<T, Mixed>) {
  515. return insert(value);
  516. }
  517. else {
  518. if (value.is_null()) {
  519. return insert_null();
  520. }
  521. else {
  522. return insert(value.get<typename util::RemoveOptional<T>::type>());
  523. }
  524. }
  525. }
  526. template <class T>
  527. std::pair<size_t, bool> Set<T>::erase(T value)
  528. {
  529. update_if_needed();
  530. this->ensure_writeable();
  531. auto it = find_impl(value);
  532. if (it == end() || !SetElementEquals<T>{}(*it, value)) {
  533. return {npos, false};
  534. }
  535. if (Replication* repl = m_obj.get_replication()) {
  536. this->erase_repl(repl, it.index(), value);
  537. }
  538. do_erase(it.index());
  539. bump_content_version();
  540. return {it.index(), true};
  541. }
  542. template <class T>
  543. std::pair<size_t, bool> Set<T>::erase_any(Mixed value)
  544. {
  545. if constexpr (std::is_same_v<T, Mixed>) {
  546. return erase(value);
  547. }
  548. else {
  549. if (value.is_null()) {
  550. return erase_null();
  551. }
  552. else {
  553. return erase(value.get<typename util::RemoveOptional<T>::type>());
  554. }
  555. }
  556. }
  557. template <class T>
  558. inline std::pair<size_t, bool> Set<T>::insert_null()
  559. {
  560. return insert(BPlusTree<T>::default_value(this->m_nullable));
  561. }
  562. template <class T>
  563. std::pair<size_t, bool> Set<T>::erase_null()
  564. {
  565. return erase(BPlusTree<T>::default_value(this->m_nullable));
  566. }
  567. template <class T>
  568. REALM_NOINLINE size_t Set<T>::size() const
  569. {
  570. if (!is_attached())
  571. return 0;
  572. update_if_needed();
  573. if (!m_valid) {
  574. return 0;
  575. }
  576. return m_tree->size();
  577. }
  578. template <class T>
  579. inline bool Set<T>::is_null(size_t ndx) const
  580. {
  581. return m_nullable && value_is_null(get(ndx));
  582. }
  583. template <class T>
  584. inline void Set<T>::clear()
  585. {
  586. ensure_created();
  587. update_if_needed();
  588. this->ensure_writeable();
  589. if (size() > 0) {
  590. if (Replication* repl = this->m_obj.get_replication()) {
  591. this->clear_repl(repl);
  592. }
  593. do_clear();
  594. bump_content_version();
  595. }
  596. }
  597. template <class T>
  598. inline util::Optional<Mixed> Set<T>::min(size_t* return_ndx) const
  599. {
  600. update_if_needed();
  601. return MinHelper<T>::eval(*m_tree, return_ndx);
  602. }
  603. template <class T>
  604. inline util::Optional<Mixed> Set<T>::max(size_t* return_ndx) const
  605. {
  606. update_if_needed();
  607. return MaxHelper<T>::eval(*m_tree, return_ndx);
  608. }
  609. template <class T>
  610. inline util::Optional<Mixed> Set<T>::sum(size_t* return_cnt) const
  611. {
  612. update_if_needed();
  613. return SumHelper<T>::eval(*m_tree, return_cnt);
  614. }
  615. template <class T>
  616. inline util::Optional<Mixed> Set<T>::avg(size_t* return_cnt) const
  617. {
  618. update_if_needed();
  619. return AverageHelper<T>::eval(*m_tree, return_cnt);
  620. }
  621. void set_sorted_indices(size_t sz, std::vector<size_t>& indices, bool ascending);
  622. template <class T>
  623. inline void Set<T>::sort(std::vector<size_t>& indices, bool ascending) const
  624. {
  625. auto sz = size();
  626. set_sorted_indices(sz, indices, ascending);
  627. }
  628. template <class T>
  629. inline void Set<T>::distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order) const
  630. {
  631. auto ascending = !sort_order || *sort_order;
  632. sort(indices, ascending);
  633. }
  634. template <class T>
  635. inline void Set<T>::do_insert(size_t ndx, T value)
  636. {
  637. m_tree->insert(ndx, value);
  638. }
  639. template <class T>
  640. inline void Set<T>::do_erase(size_t ndx)
  641. {
  642. m_tree->erase(ndx);
  643. }
  644. template <class T>
  645. inline void Set<T>::do_clear()
  646. {
  647. m_tree->clear();
  648. }
  649. namespace {
  650. template <class T>
  651. auto convert_to_set(const CollectionBase& rhs, bool nullable)
  652. {
  653. std::set<T, SetElementLessThan<T>> ret;
  654. for (size_t i = 0; i < rhs.size(); i++) {
  655. auto val = rhs.get_any(i);
  656. if constexpr (std::is_same_v<T, Mixed>) {
  657. ret.emplace(val);
  658. }
  659. else {
  660. if (val.is_type(ColumnTypeTraits<T>::id)) {
  661. ret.emplace(val.get<T>());
  662. }
  663. else if (val.is_null() && nullable) {
  664. ret.emplace(BPlusTree<T>::default_value(true));
  665. }
  666. }
  667. }
  668. return ret;
  669. }
  670. } // namespace
  671. template <class T>
  672. bool Set<T>::is_subset_of(const CollectionBase& rhs) const
  673. {
  674. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  675. return is_subset_of(other_set->begin(), other_set->end());
  676. }
  677. auto other_set = convert_to_set<T>(rhs, m_nullable);
  678. return is_subset_of(other_set.begin(), other_set.end());
  679. }
  680. template <class T>
  681. template <class It1, class It2>
  682. bool Set<T>::is_subset_of(It1 first, It2 last) const
  683. {
  684. return std::includes(first, last, begin(), end(), SetElementLessThan<T>{});
  685. }
  686. template <class T>
  687. bool Set<T>::is_strict_subset_of(const CollectionBase& rhs) const
  688. {
  689. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  690. return size() != rhs.size() && is_subset_of(other_set->begin(), other_set->end());
  691. }
  692. auto other_set = convert_to_set<T>(rhs, m_nullable);
  693. return size() != other_set.size() && is_subset_of(other_set.begin(), other_set.end());
  694. }
  695. template <class T>
  696. bool Set<T>::is_superset_of(const CollectionBase& rhs) const
  697. {
  698. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  699. return is_superset_of(other_set->begin(), other_set->end());
  700. }
  701. auto other_set = convert_to_set<T>(rhs, m_nullable);
  702. return is_superset_of(other_set.begin(), other_set.end());
  703. }
  704. template <class T>
  705. template <class It1, class It2>
  706. bool Set<T>::is_superset_of(It1 first, It2 last) const
  707. {
  708. return std::includes(begin(), end(), first, last, SetElementLessThan<T>{});
  709. }
  710. template <class T>
  711. bool Set<T>::is_strict_superset_of(const CollectionBase& rhs) const
  712. {
  713. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  714. return size() != rhs.size() && is_superset_of(other_set->begin(), other_set->end());
  715. }
  716. auto other_set = convert_to_set<T>(rhs, m_nullable);
  717. return size() != other_set.size() && is_superset_of(other_set.begin(), other_set.end());
  718. }
  719. template <class T>
  720. bool Set<T>::intersects(const CollectionBase& rhs) const
  721. {
  722. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  723. return intersects(other_set->begin(), other_set->end());
  724. }
  725. auto other_set = convert_to_set<T>(rhs, m_nullable);
  726. return intersects(other_set.begin(), other_set.end());
  727. }
  728. template <class T>
  729. template <class It1, class It2>
  730. bool Set<T>::intersects(It1 first, It2 last) const
  731. {
  732. SetElementLessThan<T> less;
  733. auto it = begin();
  734. while (it != end() && first != last) {
  735. if (less(*it, *first)) {
  736. ++it;
  737. }
  738. else if (less(*first, *it)) {
  739. ++first;
  740. }
  741. else {
  742. return true;
  743. }
  744. }
  745. return false;
  746. }
  747. template <class T>
  748. bool Set<T>::set_equals(const CollectionBase& rhs) const
  749. {
  750. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  751. return size() == rhs.size() && is_subset_of(other_set->begin(), other_set->end());
  752. }
  753. auto other_set = convert_to_set<T>(rhs, m_nullable);
  754. return size() == other_set.size() && is_subset_of(other_set.begin(), other_set.end());
  755. }
  756. template <class T>
  757. inline void Set<T>::assign_union(const CollectionBase& rhs)
  758. {
  759. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  760. return assign_union(other_set->begin(), other_set->end());
  761. }
  762. auto other_set = convert_to_set<T>(rhs, m_nullable);
  763. return assign_union(other_set.begin(), other_set.end());
  764. }
  765. template <class T>
  766. template <class It1, class It2>
  767. void Set<T>::assign_union(It1 first, It2 last)
  768. {
  769. std::vector<T> the_diff;
  770. std::set_difference(first, last, begin(), end(), std::back_inserter(the_diff), SetElementLessThan<T>{});
  771. // 'the_diff' now contains all the elements that are in foreign set, but not in 'this'
  772. // Now insert those elements
  773. for (auto value : the_diff) {
  774. insert(value);
  775. }
  776. }
  777. template <class T>
  778. inline void Set<T>::assign_intersection(const CollectionBase& rhs)
  779. {
  780. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  781. return assign_intersection(other_set->begin(), other_set->end());
  782. }
  783. auto other_set = convert_to_set<T>(rhs, m_nullable);
  784. return assign_intersection(other_set.begin(), other_set.end());
  785. }
  786. template <class T>
  787. template <class It1, class It2>
  788. void Set<T>::assign_intersection(It1 first, It2 last)
  789. {
  790. std::vector<T> intersection;
  791. std::set_intersection(first, last, begin(), end(), std::back_inserter(intersection), SetElementLessThan<T>{});
  792. clear();
  793. // Elements in intersection comes from foreign set, so ok to use here
  794. for (auto value : intersection) {
  795. insert(value);
  796. }
  797. }
  798. template <class T>
  799. inline void Set<T>::assign_difference(const CollectionBase& rhs)
  800. {
  801. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  802. return assign_difference(other_set->begin(), other_set->end());
  803. }
  804. auto other_set = convert_to_set<T>(rhs, m_nullable);
  805. return assign_difference(other_set.begin(), other_set.end());
  806. }
  807. template <class T>
  808. template <class It1, class It2>
  809. void Set<T>::assign_difference(It1 first, It2 last)
  810. {
  811. std::vector<T> intersection;
  812. std::set_intersection(first, last, begin(), end(), std::back_inserter(intersection), SetElementLessThan<T>{});
  813. // 'intersection' now contains all the elements that are in both foreign set and 'this'.
  814. // Remove those elements. The elements comes from the foreign set, so ok to refer to.
  815. for (auto value : intersection) {
  816. erase(value);
  817. }
  818. }
  819. template <class T>
  820. inline void Set<T>::assign_symmetric_difference(const CollectionBase& rhs)
  821. {
  822. if (auto other_set = dynamic_cast<const Set<T>*>(&rhs)) {
  823. return assign_symmetric_difference(other_set->begin(), other_set->end());
  824. }
  825. auto other_set = convert_to_set<T>(rhs, m_nullable);
  826. return assign_symmetric_difference(other_set.begin(), other_set.end());
  827. }
  828. template <class T>
  829. template <class It1, class It2>
  830. void Set<T>::assign_symmetric_difference(It1 first, It2 last)
  831. {
  832. std::vector<T> difference;
  833. std::set_difference(first, last, begin(), end(), std::back_inserter(difference), SetElementLessThan<T>{});
  834. std::vector<T> intersection;
  835. std::set_intersection(first, last, begin(), end(), std::back_inserter(intersection), SetElementLessThan<T>{});
  836. // Now remove the common elements and add the differences
  837. for (auto value : intersection) {
  838. erase(value);
  839. }
  840. for (auto value : difference) {
  841. insert(value);
  842. }
  843. }
  844. inline bool LnkSet::operator==(const LnkSet& other) const
  845. {
  846. return m_set == other.m_set;
  847. }
  848. inline bool LnkSet::operator!=(const LnkSet& other) const
  849. {
  850. return m_set != other.m_set;
  851. }
  852. inline ObjKey LnkSet::get(size_t ndx) const
  853. {
  854. update_if_needed();
  855. return m_set.get(virtual2real(ndx));
  856. }
  857. inline size_t LnkSet::find(ObjKey value) const
  858. {
  859. update_if_needed();
  860. if (value.is_unresolved()) {
  861. return not_found;
  862. }
  863. size_t ndx = m_set.find(value);
  864. if (ndx == not_found) {
  865. return not_found;
  866. }
  867. return real2virtual(ndx);
  868. }
  869. inline size_t LnkSet::find_first(ObjKey value) const
  870. {
  871. return find(value);
  872. }
  873. inline size_t LnkSet::size() const
  874. {
  875. update_if_needed();
  876. return m_set.size() - num_unresolved();
  877. }
  878. inline std::pair<size_t, bool> LnkSet::insert(ObjKey value)
  879. {
  880. REALM_ASSERT(!value.is_unresolved());
  881. update_if_needed();
  882. auto [ndx, inserted] = m_set.insert(value);
  883. return {real2virtual(ndx), inserted};
  884. }
  885. inline std::pair<size_t, bool> LnkSet::erase(ObjKey value)
  886. {
  887. REALM_ASSERT(!value.is_unresolved());
  888. update_if_needed();
  889. auto [ndx, removed] = m_set.erase(value);
  890. if (removed) {
  891. ndx = real2virtual(ndx);
  892. }
  893. return {ndx, removed};
  894. }
  895. inline bool LnkSet::is_null(size_t ndx) const
  896. {
  897. update_if_needed();
  898. return m_set.is_null(virtual2real(ndx));
  899. }
  900. inline Mixed LnkSet::get_any(size_t ndx) const
  901. {
  902. update_if_needed();
  903. return m_set.get_any(virtual2real(ndx));
  904. }
  905. inline std::pair<size_t, bool> LnkSet::insert_null()
  906. {
  907. update_if_needed();
  908. auto [ndx, inserted] = m_set.insert_null();
  909. return {real2virtual(ndx), inserted};
  910. }
  911. inline std::pair<size_t, bool> LnkSet::erase_null()
  912. {
  913. update_if_needed();
  914. auto [ndx, erased] = m_set.erase_null();
  915. if (erased) {
  916. ndx = real2virtual(ndx);
  917. }
  918. return {ndx, erased};
  919. }
  920. inline std::pair<size_t, bool> LnkSet::insert_any(Mixed value)
  921. {
  922. update_if_needed();
  923. auto [ndx, inserted] = m_set.insert_any(value);
  924. return {real2virtual(ndx), inserted};
  925. }
  926. inline std::pair<size_t, bool> LnkSet::erase_any(Mixed value)
  927. {
  928. auto [ndx, erased] = m_set.erase_any(value);
  929. if (erased) {
  930. ndx = real2virtual(ndx);
  931. }
  932. return {ndx, erased};
  933. }
  934. inline void LnkSet::clear()
  935. {
  936. m_set.clear();
  937. clear_unresolved();
  938. }
  939. inline util::Optional<Mixed> LnkSet::min(size_t* return_ndx) const
  940. {
  941. size_t found = not_found;
  942. auto value = m_set.min(&found);
  943. if (found != not_found && return_ndx) {
  944. *return_ndx = real2virtual(found);
  945. }
  946. return value;
  947. }
  948. inline util::Optional<Mixed> LnkSet::max(size_t* return_ndx) const
  949. {
  950. size_t found = not_found;
  951. auto value = m_set.max(&found);
  952. if (found != not_found && return_ndx) {
  953. *return_ndx = real2virtual(found);
  954. }
  955. return value;
  956. }
  957. inline util::Optional<Mixed> LnkSet::sum(size_t* return_cnt) const
  958. {
  959. static_cast<void>(return_cnt);
  960. REALM_TERMINATE("Not implemented");
  961. }
  962. inline util::Optional<Mixed> LnkSet::avg(size_t* return_cnt) const
  963. {
  964. static_cast<void>(return_cnt);
  965. REALM_TERMINATE("Not implemented");
  966. }
  967. inline void LnkSet::sort(std::vector<size_t>& indices, bool ascending) const
  968. {
  969. update_if_needed();
  970. // Map the input indices to real indices.
  971. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  972. return virtual2real(ndx);
  973. });
  974. m_set.sort(indices, ascending);
  975. // Map the output indices to virtual indices.
  976. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  977. return real2virtual(ndx);
  978. });
  979. }
  980. inline void LnkSet::distinct(std::vector<size_t>& indices, util::Optional<bool> sort_order) const
  981. {
  982. update_if_needed();
  983. // Map the input indices to real indices.
  984. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  985. return virtual2real(ndx);
  986. });
  987. m_set.distinct(indices, sort_order);
  988. // Map the output indices to virtual indices.
  989. std::transform(indices.begin(), indices.end(), indices.begin(), [this](size_t ndx) {
  990. return real2virtual(ndx);
  991. });
  992. }
  993. inline const Obj& LnkSet::get_obj() const noexcept
  994. {
  995. return m_set.get_obj();
  996. }
  997. inline bool LnkSet::is_attached() const
  998. {
  999. return m_set.is_attached();
  1000. }
  1001. inline bool LnkSet::has_changed() const
  1002. {
  1003. return m_set.has_changed();
  1004. }
  1005. inline ColKey LnkSet::get_col_key() const noexcept
  1006. {
  1007. return m_set.get_col_key();
  1008. }
  1009. inline size_t LnkSet::find_any(Mixed value) const
  1010. {
  1011. if (value.is_null())
  1012. return not_found;
  1013. if (value.get_type() != type_Link)
  1014. return not_found;
  1015. size_t found = find(value.get<ObjKey>());
  1016. if (found != not_found) {
  1017. found = real2virtual(found);
  1018. }
  1019. return found;
  1020. }
  1021. inline bool LnkSet::is_obj_valid(size_t) const noexcept
  1022. {
  1023. // LnkSet cannot contain NULL links.
  1024. return true;
  1025. }
  1026. inline Obj LnkSet::get_object(size_t ndx) const
  1027. {
  1028. ObjKey key = get(ndx);
  1029. return get_target_table()->get_object(key);
  1030. }
  1031. inline ObjKey LnkSet::get_key(size_t ndx) const
  1032. {
  1033. return get(ndx);
  1034. }
  1035. inline void LnkSet::assign_union(const CollectionBase& rhs)
  1036. {
  1037. m_set.assign_union(rhs);
  1038. update_unresolved();
  1039. }
  1040. inline void LnkSet::assign_intersection(const CollectionBase& rhs)
  1041. {
  1042. m_set.assign_intersection(rhs);
  1043. update_unresolved();
  1044. }
  1045. inline void LnkSet::assign_difference(const CollectionBase& rhs)
  1046. {
  1047. m_set.assign_difference(rhs);
  1048. update_unresolved();
  1049. }
  1050. inline void LnkSet::assign_symmetric_difference(const CollectionBase& rhs)
  1051. {
  1052. m_set.assign_symmetric_difference(rhs);
  1053. update_unresolved();
  1054. }
  1055. } // namespace realm
  1056. #endif // REALM_SET_HPP