queue.hpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737
  1. /* Declarations for the queue template type.
  2. This file is part of xrcu.
  3. xrcu is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation; either version 3 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <https://www.gnu.org/licenses/>. */
  13. #ifndef __XRCU_QUEUE_HPP__
  14. #define __XRCU_QUEUE_HPP__ 1
  15. #include "xrcu.hpp"
  16. #include "optional.hpp"
  17. #include "xatomic.hpp"
  18. #include "utils.hpp"
  19. #include <cstddef>
  20. #include <atomic>
  21. #include <type_traits>
  22. #include <initializer_list>
  23. namespace std
  24. {
  25. struct forward_iterator_tag;
  26. }
  27. namespace xrcu
  28. {
  29. namespace detail
  30. {
  31. static inline uint32_t upsize (uint32_t x)
  32. {
  33. x |= x >> 1;
  34. x |= x >> 2;
  35. x |= x >> 4;
  36. x |= x >> 8;
  37. x |= x >> 16;
  38. return (x + 1);
  39. }
  40. static inline uint64_t upsize (uint64_t x)
  41. {
  42. x |= x >> 1;
  43. x |= x >> 2;
  44. x |= x >> 4;
  45. x |= x >> 8;
  46. x |= x >> 16;
  47. x |= x >> 32;
  48. return (x + 1);
  49. }
  50. struct alignas (uintptr_t) q_data : public finalizable
  51. {
  52. uintptr_t *ptrs;
  53. size_t cap;
  54. std::atomic<size_t> wr_idx;
  55. std::atomic<size_t> rd_idx;
  56. static q_data* make (size_t cnt, uintptr_t empty);
  57. size_t _Wridx () const
  58. {
  59. return (this->wr_idx.load (std::memory_order_relaxed));
  60. }
  61. size_t _Rdidx () const
  62. {
  63. return (this->rd_idx.load (std::memory_order_relaxed));
  64. }
  65. bool push (uintptr_t val, uintptr_t xbit, uintptr_t empty)
  66. {
  67. while (true)
  68. {
  69. size_t curr = this->_Wridx ();
  70. if (curr >= this->cap)
  71. return (false);
  72. uintptr_t xv = this->ptrs[curr];
  73. if ((xv & xbit) != 0)
  74. return (false);
  75. else if (xv == empty &&
  76. xatomic_cas_bool (&this->ptrs[curr], xv, val))
  77. {
  78. this->wr_idx.fetch_add (1, std::memory_order_acq_rel);
  79. return (true);
  80. }
  81. xatomic_spin_nop ();
  82. }
  83. }
  84. uintptr_t pop (uintptr_t xbit, uintptr_t dfl)
  85. {
  86. while (true)
  87. {
  88. size_t curr = this->_Rdidx ();
  89. if (curr >= this->_Wridx ())
  90. return (dfl);
  91. uintptr_t rv = this->ptrs[curr];
  92. if (rv & xbit)
  93. return (xbit);
  94. else if (rv != dfl && xatomic_cas_bool (&this->ptrs[curr], rv, dfl))
  95. {
  96. this->rd_idx.fetch_add (1, std::memory_order_relaxed);
  97. return (rv);
  98. }
  99. xatomic_spin_nop ();
  100. }
  101. }
  102. uintptr_t front () const
  103. {
  104. return (this->ptrs[this->_Rdidx ()]);
  105. }
  106. uintptr_t back () const
  107. {
  108. size_t idx = this->_Wridx ();
  109. if (idx == 0)
  110. return (this->ptrs[this->cap]);
  111. return (this->ptrs[idx - 1]);
  112. }
  113. size_t size () const
  114. {
  115. return (this->_Wridx () - this->_Rdidx ());
  116. }
  117. void safe_destroy ();
  118. };
  119. inline void
  120. q_replace_cb (std::atomic<q_data *>& ptr, q_data *old, q_data *nq, uintptr_t)
  121. {
  122. finalize (old);
  123. ptr.store (nq, std::memory_order_relaxed);
  124. }
  125. inline void
  126. q_clear_cb (std::atomic<q_data *>&, q_data *old, q_data *, uintptr_t empty)
  127. {
  128. old->wr_idx.store (old->cap, std::memory_order_relaxed);
  129. old->rd_idx.store (old->cap, std::memory_order_relaxed);
  130. for (size_t i = 0; i < old->cap; ++i)
  131. old->ptrs[i] = empty;
  132. old->rd_idx.store (0, std::memory_order_release);
  133. old->wr_idx.store (0, std::memory_order_release);
  134. }
  135. } // namespace detail
  136. template <class T>
  137. struct queue
  138. {
  139. typedef detail::wrapped_traits<(sizeof (T) < sizeof (uintptr_t) &&
  140. std::is_integral<T>::value) || (std::is_pointer<T>::value &&
  141. alignof (T) >= 8), T> val_traits;
  142. std::atomic<detail::q_data *> impl;
  143. typedef T value_type;
  144. typedef T& reference;
  145. typedef const T& const_reference;
  146. typedef T* pointer;
  147. typedef const T* const_pointer;
  148. typedef ptrdiff_t difference_type;
  149. typedef size_t size_type;
  150. void _Init (size_t size)
  151. {
  152. this->impl = detail::q_data::make (size, val_traits::FREE);
  153. }
  154. detail::q_data* _Data ()
  155. {
  156. return (this->impl.load (std::memory_order_relaxed));
  157. }
  158. const detail::q_data* _Data () const
  159. {
  160. return (this->impl.load (std::memory_order_relaxed));
  161. }
  162. void _Set_data (detail::q_data *qdp)
  163. {
  164. this->impl.store (qdp, std::memory_order_relaxed);
  165. }
  166. struct iterator : public cs_guard
  167. {
  168. const detail::q_data *qdp;
  169. size_t idx;
  170. uintptr_t c_val;
  171. typedef std::forward_iterator_tag iterator_category;
  172. iterator (const detail::q_data *q, size_t s) : qdp (q), idx (s)
  173. {
  174. if (this->qdp)
  175. this->_Adv ();
  176. }
  177. iterator (const iterator& it) :
  178. qdp (it.qdp), idx (it.idx), c_val (it.c_val)
  179. {
  180. }
  181. iterator (iterator&& it) : qdp (it.qdp), idx (it.idx), c_val (it.c_val)
  182. {
  183. it.qdp = nullptr;
  184. }
  185. void _Adv ()
  186. {
  187. for (; this->idx < this->qdp->cap; ++this->idx)
  188. {
  189. this->c_val = this->qdp->ptrs[this->idx] & ~val_traits::XBIT;
  190. if (this->c_val != val_traits::DELT &&
  191. this->c_val != val_traits::FREE)
  192. return;
  193. }
  194. this->qdp = nullptr;
  195. this->idx = 0;
  196. }
  197. T operator* ()
  198. {
  199. return (val_traits::get (this->c_val));
  200. }
  201. iterator& operator++ ()
  202. {
  203. ++this->idx;
  204. this->_Adv ();
  205. return (*this);
  206. }
  207. iterator operator++ (int)
  208. {
  209. iterator rv { *this };
  210. ++*this;
  211. return (rv);
  212. }
  213. bool operator== (const iterator& it) const
  214. {
  215. return (this->qdp == it.qdp && this->idx == it.idx);
  216. }
  217. bool operator!= (const iterator& it) const
  218. {
  219. return (!(*this == it));
  220. }
  221. };
  222. typedef iterator const_iterator;
  223. queue ()
  224. {
  225. this->_Init (8);
  226. }
  227. template <class T1, class T2>
  228. void _Init (T1 n, const T2& val, std::true_type)
  229. {
  230. size_t ns = (size_t)n;
  231. auto qdp = detail::q_data::make (detail::upsize (ns), val_traits::FREE);
  232. try
  233. {
  234. for (size_t i = 0; i < ns; )
  235. {
  236. qdp->ptrs[i] = val_traits::make (val);
  237. qdp->wr_idx.store (++i, std::memory_order_relaxed);
  238. }
  239. }
  240. catch (...)
  241. {
  242. _Destroy (qdp);
  243. throw;
  244. }
  245. this->_Set_data (qdp);
  246. }
  247. template <class It>
  248. void _Init (It first, It last, std::false_type)
  249. {
  250. auto qdp = detail::q_data::make (8, val_traits::FREE);
  251. try
  252. {
  253. for (size_t i = 0; first != last; ++first)
  254. {
  255. qdp->ptrs[i] = val_traits::make (*first);
  256. qdp->wr_idx.store (++i, std::memory_order_relaxed);
  257. if (i == qdp->cap)
  258. {
  259. auto q2 = detail::q_data::make (i * 2, val_traits::FREE);
  260. for (size_t j = 0; j < i; ++j)
  261. q2->ptrs[j] = qdp->ptrs[j];
  262. qdp->safe_destroy ();
  263. qdp = q2;
  264. }
  265. }
  266. }
  267. catch (...)
  268. {
  269. _Destroy (qdp);
  270. throw;
  271. }
  272. this->_Set_data (qdp);
  273. }
  274. template <class T1, class T2>
  275. queue (T1 first, T2 last)
  276. {
  277. this->_Init (first, last, typename std::is_integral<T1>::type ());
  278. }
  279. queue (const queue<T>& right) : queue (right.begin (), right.end ())
  280. {
  281. }
  282. queue (queue<T>&& right)
  283. {
  284. this->_Set_data (right._Data ());
  285. right._Set_data (nullptr);
  286. }
  287. queue (std::initializer_list<T> lst) : queue (lst.begin (), lst.end ())
  288. {
  289. }
  290. bool _Rearm (uintptr_t elem, detail::q_data *qdp)
  291. {
  292. size_t ix;
  293. uintptr_t prev;
  294. while (true)
  295. {
  296. ix = qdp->_Rdidx ();
  297. prev = xatomic_or (&qdp->ptrs[ix], val_traits::XBIT);
  298. if (prev == val_traits::DELT)
  299. { // Another thread deleted this entry - Retry.
  300. xatomic_spin_nop ();
  301. continue;
  302. }
  303. else if ((prev & val_traits::XBIT) == 0)
  304. break;
  305. while (true)
  306. {
  307. if (qdp != this->_Data ())
  308. // Impl pointer has been installed - Return.
  309. return (false);
  310. else if ((qdp->ptrs[ix] & val_traits::XBIT) == 0)
  311. /* The thread rearming the queue raised an exception.
  312. * Recurse and see if we can pick up the slack. */
  313. return (this->_Rearm (elem, qdp));
  314. xatomic_spin_nop ();
  315. }
  316. }
  317. detail::q_data *nq = nullptr;
  318. try
  319. {
  320. nq = detail::q_data::make (qdp->cap * 2, val_traits::FREE);
  321. }
  322. catch (...)
  323. {
  324. xatomic_and (&qdp->ptrs[ix], ~val_traits::XBIT);
  325. val_traits::free (elem);
  326. throw;
  327. }
  328. uintptr_t *outp = nq->ptrs;
  329. for (*outp++ = prev; ++ix < qdp->cap; )
  330. *outp++ = xatomic_or (&qdp->ptrs[ix], val_traits::XBIT);
  331. *outp++ = elem;
  332. nq->wr_idx.store (outp - nq->ptrs, std::memory_order_relaxed);
  333. finalize (qdp);
  334. this->_Set_data (nq);
  335. return (true);
  336. }
  337. void _Push (uintptr_t val)
  338. {
  339. while (true)
  340. {
  341. auto qdp = this->_Data ();
  342. if (qdp->push (val, val_traits::XBIT, val_traits::FREE) ||
  343. this->_Rearm (val, qdp))
  344. break;
  345. }
  346. }
  347. void push (const T& elem)
  348. {
  349. cs_guard g;
  350. this->_Push (val_traits::make (elem));
  351. }
  352. template <class ...Args>
  353. void emplace (Args&& ...args)
  354. {
  355. cs_guard g;
  356. this->_Push (val_traits::make (std::forward<Args>(args)...));
  357. }
  358. optional<T> pop ()
  359. {
  360. cs_guard g;
  361. while (true)
  362. {
  363. auto qdp = this->_Data ();
  364. uintptr_t val = qdp->pop (val_traits::XBIT, val_traits::DELT);
  365. if (val == val_traits::DELT)
  366. // Queue is empty.
  367. return (optional<T> ());
  368. else if (val != val_traits::XBIT)
  369. {
  370. val_traits::destroy (val);
  371. optional<T> rv (val_traits::get (val));
  372. return (rv);
  373. }
  374. while (qdp == this->_Data ())
  375. xatomic_spin_nop ();
  376. }
  377. }
  378. optional<T> front () const
  379. {
  380. cs_guard g;
  381. while (true)
  382. {
  383. uintptr_t rv = this->_Data()->front () & ~val_traits::XBIT;
  384. if (rv == val_traits::DELT)
  385. { // Just popped the item from the queue - Retry.
  386. xatomic_spin_nop ();
  387. continue;
  388. }
  389. else if (rv == val_traits::FREE)
  390. return (optional<T> ());
  391. return (optional<T> (val_traits::get (rv)));
  392. }
  393. }
  394. optional<T> back () const
  395. {
  396. cs_guard g;
  397. while (true)
  398. {
  399. uintptr_t rv = this->_Data()->back () & ~val_traits::XBIT;
  400. if (rv == val_traits::DELT)
  401. {
  402. xatomic_spin_nop ();
  403. continue;
  404. }
  405. else if (rv == val_traits::FREE)
  406. return (optional<T> ());
  407. return (optional<T> (val_traits::get (rv)));
  408. }
  409. }
  410. size_t size () const
  411. {
  412. cs_guard g;
  413. return (this->_Data()->size ());
  414. }
  415. bool empty () const
  416. {
  417. return (this->size () == 0);
  418. }
  419. size_t max_size () const
  420. {
  421. return (~(size_t)0);
  422. }
  423. iterator begin () const
  424. {
  425. cs_guard g;
  426. auto qdp = this->_Data ();
  427. return (iterator (qdp, qdp->_Rdidx ()));
  428. }
  429. iterator end () const
  430. {
  431. return (iterator (nullptr, 0));
  432. }
  433. const_iterator cbegin () const
  434. {
  435. return (this->begin ());
  436. }
  437. const_iterator cend () const
  438. {
  439. return (this->end ());
  440. }
  441. void _Call_cb (detail::q_data *nq, uintptr_t xv,
  442. void (*f) (std::atomic<detail::q_data *>&,
  443. detail::q_data *, detail::q_data *, uintptr_t))
  444. {
  445. while (true)
  446. {
  447. auto qdp = this->_Data ();
  448. size_t ix = qdp->_Rdidx ();
  449. uintptr_t prev = xatomic_or (&qdp->ptrs[ix], val_traits::XBIT);
  450. if (prev == val_traits::DELT)
  451. continue;
  452. else if ((prev & val_traits::XBIT) == 0)
  453. {
  454. if (prev != val_traits::FREE)
  455. val_traits::destroy (prev);
  456. while (++ix < qdp->cap)
  457. {
  458. prev = xatomic_or (&qdp->ptrs[ix], val_traits::XBIT);
  459. if (prev != val_traits::FREE && prev != val_traits::DELT)
  460. val_traits::destroy (prev);
  461. }
  462. f (this->impl, qdp, nq, xv);
  463. return;
  464. }
  465. while (true)
  466. {
  467. if (qdp != this->_Data () ||
  468. (qdp->ptrs[ix] & val_traits::XBIT) == 0)
  469. break;
  470. xatomic_spin_nop ();
  471. }
  472. }
  473. }
  474. void _Assign (detail::q_data *nq)
  475. {
  476. this->_Call_cb (nq, 0, detail::q_replace_cb);
  477. }
  478. template <class T1, class T2>
  479. void assign (T1 first, T2 last)
  480. {
  481. cs_guard g;
  482. auto tmp = queue<T> (first, last);
  483. this->_Assign (tmp._Data ());
  484. tmp._Set_data (nullptr);
  485. }
  486. void assign (std::initializer_list<T> lst)
  487. {
  488. this->assign (lst.begin (), lst.end ());
  489. }
  490. queue<T>& operator= (const queue<T>& right)
  491. {
  492. if (this == &right)
  493. return (*this);
  494. this->assign (right.begin (), right.end ());
  495. return (*this);
  496. }
  497. bool operator== (const queue<T>& right) const
  498. {
  499. auto x1 = this->cbegin (), x2 = this->cend ();
  500. auto y1 = right.cbegin (), y2 = right.cend ();
  501. for (; x1 != x2 && y1 != y2; ++x1, ++y1)
  502. if (*x1 != *y1)
  503. return (false);
  504. return (x1 == x2 && y1 == y2);
  505. }
  506. bool operator!= (const queue<T>& right) const
  507. {
  508. return (!(*this == right));
  509. }
  510. bool operator< (const queue<T>& right) const
  511. {
  512. auto x1 = this->cbegin (), x2 = this->cend ();
  513. auto y1 = right.cbegin (), y2 = right.cend ();
  514. for (; x1 != x2; ++x1, ++y1)
  515. {
  516. if (y1 == y2 || *y1 < *x1)
  517. return (false);
  518. else if (*x1 < *y1)
  519. return (true);
  520. }
  521. return (y1 != y2);
  522. }
  523. bool operator> (const queue<T>& right) const
  524. {
  525. return (right < *this);
  526. }
  527. bool operator<= (const queue<T>& right) const
  528. {
  529. return (!(right < *this));
  530. }
  531. bool operator>= (const queue<T>& right) const
  532. {
  533. return (!(*this < right));
  534. }
  535. queue<T>& operator= (queue<T>&& right)
  536. {
  537. auto prev = this->impl.exchange (right._Data (),
  538. std::memory_order_acq_rel);
  539. finalize (prev);
  540. right._Set_data (nullptr);
  541. return (*this);
  542. }
  543. static void _Destroy (detail::q_data *qdp)
  544. {
  545. for (size_t i = qdp->_Rdidx (); i < qdp->cap; ++i)
  546. {
  547. uintptr_t val = qdp->ptrs[i] & ~val_traits::XBIT;
  548. if (val != val_traits::FREE && val != val_traits::DELT)
  549. val_traits::free (val);
  550. }
  551. qdp->safe_destroy ();
  552. }
  553. void clear ()
  554. {
  555. cs_guard g;
  556. this->_Call_cb (nullptr, val_traits::FREE, detail::q_clear_cb);
  557. }
  558. size_t _Lock ()
  559. {
  560. while (true)
  561. {
  562. auto qdp = this->_Data ();
  563. size_t ix = qdp->_Rdidx ();
  564. uintptr_t prev = xatomic_or (&qdp->ptrs[ix], val_traits::XBIT);
  565. if ((prev & val_traits::XBIT) == 0)
  566. return (qdp->wr_idx.exchange (qdp->cap,
  567. std::memory_order_acq_rel));
  568. while (qdp == this->_Data () &&
  569. (qdp->ptrs[ix] & val_traits::XBIT) != 0)
  570. xatomic_spin_nop ();
  571. }
  572. }
  573. void swap (queue<T>& right)
  574. {
  575. if (this == &right)
  576. return;
  577. size_t s1 = this->_Lock ();
  578. size_t s2 = right._Lock ();
  579. auto tmp = this->_Data ();
  580. this->_Set_data (right._Data ());
  581. right._Set_data (tmp);
  582. auto d1 = this->_Data();
  583. auto d2 = right._Data();
  584. d1->wr_idx.store (s2, std::memory_order_relaxed);
  585. d2->wr_idx.store (s1, std::memory_order_relaxed);
  586. d1->ptrs[d1->_Rdidx ()] &= ~val_traits::XBIT;
  587. d2->ptrs[d2->_Rdidx ()] &= ~val_traits::XBIT;
  588. }
  589. ~queue ()
  590. {
  591. auto qdp = this->_Data ();
  592. if (!qdp)
  593. return;
  594. _Destroy (qdp);
  595. this->_Set_data (nullptr);
  596. }
  597. };
  598. } // namespace xrcu
  599. namespace std
  600. {
  601. template <class T>
  602. void swap (xrcu::queue<T>& left, xrcu::queue<T>& right)
  603. {
  604. left.swap (right);
  605. }
  606. } // namespace std
  607. #endif