util.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594
  1. /* SPDX-License-Identifier: GPL-2.0 */
  2. #ifndef _BCACHE_UTIL_H
  3. #define _BCACHE_UTIL_H
  4. #include <linux/blkdev.h>
  5. #include <linux/errno.h>
  6. #include <linux/kernel.h>
  7. #include <linux/sched/clock.h>
  8. #include <linux/llist.h>
  9. #include <linux/ratelimit.h>
  10. #include <linux/vmalloc.h>
  11. #include <linux/workqueue.h>
  12. #include <linux/crc64.h>
  13. #include "closure.h"
  14. #define PAGE_SECTORS (PAGE_SIZE / 512)
  15. struct closure;
  16. #ifdef CONFIG_BCACHE_DEBUG
  17. #define EBUG_ON(cond) BUG_ON(cond)
  18. #define atomic_dec_bug(v) BUG_ON(atomic_dec_return(v) < 0)
  19. #define atomic_inc_bug(v, i) BUG_ON(atomic_inc_return(v) <= i)
  20. #else /* DEBUG */
  21. #define EBUG_ON(cond) do { if (cond); } while (0)
  22. #define atomic_dec_bug(v) atomic_dec(v)
  23. #define atomic_inc_bug(v, i) atomic_inc(v)
  24. #endif
  25. #define DECLARE_HEAP(type, name) \
  26. struct { \
  27. size_t size, used; \
  28. type *data; \
  29. } name
  30. #define init_heap(heap, _size, gfp) \
  31. ({ \
  32. size_t _bytes; \
  33. (heap)->used = 0; \
  34. (heap)->size = (_size); \
  35. _bytes = (heap)->size * sizeof(*(heap)->data); \
  36. (heap)->data = kvmalloc(_bytes, (gfp) & GFP_KERNEL); \
  37. (heap)->data; \
  38. })
  39. #define free_heap(heap) \
  40. do { \
  41. kvfree((heap)->data); \
  42. (heap)->data = NULL; \
  43. } while (0)
  44. #define heap_swap(h, i, j) swap((h)->data[i], (h)->data[j])
  45. #define heap_sift(h, i, cmp) \
  46. do { \
  47. size_t _r, _j = i; \
  48. \
  49. for (; _j * 2 + 1 < (h)->used; _j = _r) { \
  50. _r = _j * 2 + 1; \
  51. if (_r + 1 < (h)->used && \
  52. cmp((h)->data[_r], (h)->data[_r + 1])) \
  53. _r++; \
  54. \
  55. if (cmp((h)->data[_r], (h)->data[_j])) \
  56. break; \
  57. heap_swap(h, _r, _j); \
  58. } \
  59. } while (0)
  60. #define heap_sift_down(h, i, cmp) \
  61. do { \
  62. while (i) { \
  63. size_t p = (i - 1) / 2; \
  64. if (cmp((h)->data[i], (h)->data[p])) \
  65. break; \
  66. heap_swap(h, i, p); \
  67. i = p; \
  68. } \
  69. } while (0)
  70. #define heap_add(h, d, cmp) \
  71. ({ \
  72. bool _r = !heap_full(h); \
  73. if (_r) { \
  74. size_t _i = (h)->used++; \
  75. (h)->data[_i] = d; \
  76. \
  77. heap_sift_down(h, _i, cmp); \
  78. heap_sift(h, _i, cmp); \
  79. } \
  80. _r; \
  81. })
  82. #define heap_pop(h, d, cmp) \
  83. ({ \
  84. bool _r = (h)->used; \
  85. if (_r) { \
  86. (d) = (h)->data[0]; \
  87. (h)->used--; \
  88. heap_swap(h, 0, (h)->used); \
  89. heap_sift(h, 0, cmp); \
  90. } \
  91. _r; \
  92. })
  93. #define heap_peek(h) ((h)->used ? (h)->data[0] : NULL)
  94. #define heap_full(h) ((h)->used == (h)->size)
  95. #define DECLARE_FIFO(type, name) \
  96. struct { \
  97. size_t front, back, size, mask; \
  98. type *data; \
  99. } name
  100. #define fifo_for_each(c, fifo, iter) \
  101. for (iter = (fifo)->front; \
  102. c = (fifo)->data[iter], iter != (fifo)->back; \
  103. iter = (iter + 1) & (fifo)->mask)
  104. #define __init_fifo(fifo, gfp) \
  105. ({ \
  106. size_t _allocated_size, _bytes; \
  107. BUG_ON(!(fifo)->size); \
  108. \
  109. _allocated_size = roundup_pow_of_two((fifo)->size + 1); \
  110. _bytes = _allocated_size * sizeof(*(fifo)->data); \
  111. \
  112. (fifo)->mask = _allocated_size - 1; \
  113. (fifo)->front = (fifo)->back = 0; \
  114. \
  115. (fifo)->data = kvmalloc(_bytes, (gfp) & GFP_KERNEL); \
  116. (fifo)->data; \
  117. })
  118. #define init_fifo_exact(fifo, _size, gfp) \
  119. ({ \
  120. (fifo)->size = (_size); \
  121. __init_fifo(fifo, gfp); \
  122. })
  123. #define init_fifo(fifo, _size, gfp) \
  124. ({ \
  125. (fifo)->size = (_size); \
  126. if ((fifo)->size > 4) \
  127. (fifo)->size = roundup_pow_of_two((fifo)->size) - 1; \
  128. __init_fifo(fifo, gfp); \
  129. })
  130. #define free_fifo(fifo) \
  131. do { \
  132. kvfree((fifo)->data); \
  133. (fifo)->data = NULL; \
  134. } while (0)
  135. #define fifo_used(fifo) (((fifo)->back - (fifo)->front) & (fifo)->mask)
  136. #define fifo_free(fifo) ((fifo)->size - fifo_used(fifo))
  137. #define fifo_empty(fifo) (!fifo_used(fifo))
  138. #define fifo_full(fifo) (!fifo_free(fifo))
  139. #define fifo_front(fifo) ((fifo)->data[(fifo)->front])
  140. #define fifo_back(fifo) \
  141. ((fifo)->data[((fifo)->back - 1) & (fifo)->mask])
  142. #define fifo_idx(fifo, p) (((p) - &fifo_front(fifo)) & (fifo)->mask)
  143. #define fifo_push_back(fifo, i) \
  144. ({ \
  145. bool _r = !fifo_full((fifo)); \
  146. if (_r) { \
  147. (fifo)->data[(fifo)->back++] = (i); \
  148. (fifo)->back &= (fifo)->mask; \
  149. } \
  150. _r; \
  151. })
  152. #define fifo_pop_front(fifo, i) \
  153. ({ \
  154. bool _r = !fifo_empty((fifo)); \
  155. if (_r) { \
  156. (i) = (fifo)->data[(fifo)->front++]; \
  157. (fifo)->front &= (fifo)->mask; \
  158. } \
  159. _r; \
  160. })
  161. #define fifo_push_front(fifo, i) \
  162. ({ \
  163. bool _r = !fifo_full((fifo)); \
  164. if (_r) { \
  165. --(fifo)->front; \
  166. (fifo)->front &= (fifo)->mask; \
  167. (fifo)->data[(fifo)->front] = (i); \
  168. } \
  169. _r; \
  170. })
  171. #define fifo_pop_back(fifo, i) \
  172. ({ \
  173. bool _r = !fifo_empty((fifo)); \
  174. if (_r) { \
  175. --(fifo)->back; \
  176. (fifo)->back &= (fifo)->mask; \
  177. (i) = (fifo)->data[(fifo)->back] \
  178. } \
  179. _r; \
  180. })
  181. #define fifo_push(fifo, i) fifo_push_back(fifo, (i))
  182. #define fifo_pop(fifo, i) fifo_pop_front(fifo, (i))
  183. #define fifo_swap(l, r) \
  184. do { \
  185. swap((l)->front, (r)->front); \
  186. swap((l)->back, (r)->back); \
  187. swap((l)->size, (r)->size); \
  188. swap((l)->mask, (r)->mask); \
  189. swap((l)->data, (r)->data); \
  190. } while (0)
  191. #define fifo_move(dest, src) \
  192. do { \
  193. typeof(*((dest)->data)) _t; \
  194. while (!fifo_full(dest) && \
  195. fifo_pop(src, _t)) \
  196. fifo_push(dest, _t); \
  197. } while (0)
  198. /*
  199. * Simple array based allocator - preallocates a number of elements and you can
  200. * never allocate more than that, also has no locking.
  201. *
  202. * Handy because if you know you only need a fixed number of elements you don't
  203. * have to worry about memory allocation failure, and sometimes a mempool isn't
  204. * what you want.
  205. *
  206. * We treat the free elements as entries in a singly linked list, and the
  207. * freelist as a stack - allocating and freeing push and pop off the freelist.
  208. */
  209. #define DECLARE_ARRAY_ALLOCATOR(type, name, size) \
  210. struct { \
  211. type *freelist; \
  212. type data[size]; \
  213. } name
  214. #define array_alloc(array) \
  215. ({ \
  216. typeof((array)->freelist) _ret = (array)->freelist; \
  217. \
  218. if (_ret) \
  219. (array)->freelist = *((typeof((array)->freelist) *) _ret);\
  220. \
  221. _ret; \
  222. })
  223. #define array_free(array, ptr) \
  224. do { \
  225. typeof((array)->freelist) _ptr = ptr; \
  226. \
  227. *((typeof((array)->freelist) *) _ptr) = (array)->freelist; \
  228. (array)->freelist = _ptr; \
  229. } while (0)
  230. #define array_allocator_init(array) \
  231. do { \
  232. typeof((array)->freelist) _i; \
  233. \
  234. BUILD_BUG_ON(sizeof((array)->data[0]) < sizeof(void *)); \
  235. (array)->freelist = NULL; \
  236. \
  237. for (_i = (array)->data; \
  238. _i < (array)->data + ARRAY_SIZE((array)->data); \
  239. _i++) \
  240. array_free(array, _i); \
  241. } while (0)
  242. #define array_freelist_empty(array) ((array)->freelist == NULL)
  243. #define ANYSINT_MAX(t) \
  244. ((((t) 1 << (sizeof(t) * 8 - 2)) - (t) 1) * (t) 2 + (t) 1)
  245. int bch_strtoint_h(const char *cp, int *res);
  246. int bch_strtouint_h(const char *cp, unsigned int *res);
  247. int bch_strtoll_h(const char *cp, long long *res);
  248. int bch_strtoull_h(const char *cp, unsigned long long *res);
  249. static inline int bch_strtol_h(const char *cp, long *res)
  250. {
  251. #if BITS_PER_LONG == 32
  252. return bch_strtoint_h(cp, (int *) res);
  253. #else
  254. return bch_strtoll_h(cp, (long long *) res);
  255. #endif
  256. }
  257. static inline int bch_strtoul_h(const char *cp, long *res)
  258. {
  259. #if BITS_PER_LONG == 32
  260. return bch_strtouint_h(cp, (unsigned int *) res);
  261. #else
  262. return bch_strtoull_h(cp, (unsigned long long *) res);
  263. #endif
  264. }
  265. #define strtoi_h(cp, res) \
  266. (__builtin_types_compatible_p(typeof(*res), int) \
  267. ? bch_strtoint_h(cp, (void *) res) \
  268. : __builtin_types_compatible_p(typeof(*res), long) \
  269. ? bch_strtol_h(cp, (void *) res) \
  270. : __builtin_types_compatible_p(typeof(*res), long long) \
  271. ? bch_strtoll_h(cp, (void *) res) \
  272. : __builtin_types_compatible_p(typeof(*res), unsigned int) \
  273. ? bch_strtouint_h(cp, (void *) res) \
  274. : __builtin_types_compatible_p(typeof(*res), unsigned long) \
  275. ? bch_strtoul_h(cp, (void *) res) \
  276. : __builtin_types_compatible_p(typeof(*res), unsigned long long)\
  277. ? bch_strtoull_h(cp, (void *) res) : -EINVAL)
  278. #define strtoul_safe(cp, var) \
  279. ({ \
  280. unsigned long _v; \
  281. int _r = kstrtoul(cp, 10, &_v); \
  282. if (!_r) \
  283. var = _v; \
  284. _r; \
  285. })
  286. #define strtoul_safe_clamp(cp, var, min, max) \
  287. ({ \
  288. unsigned long _v; \
  289. int _r = kstrtoul(cp, 10, &_v); \
  290. if (!_r) \
  291. var = clamp_t(typeof(var), _v, min, max); \
  292. _r; \
  293. })
  294. #define snprint(buf, size, var) \
  295. snprintf(buf, size, \
  296. __builtin_types_compatible_p(typeof(var), int) \
  297. ? "%i\n" : \
  298. __builtin_types_compatible_p(typeof(var), unsigned int) \
  299. ? "%u\n" : \
  300. __builtin_types_compatible_p(typeof(var), long) \
  301. ? "%li\n" : \
  302. __builtin_types_compatible_p(typeof(var), unsigned long)\
  303. ? "%lu\n" : \
  304. __builtin_types_compatible_p(typeof(var), int64_t) \
  305. ? "%lli\n" : \
  306. __builtin_types_compatible_p(typeof(var), uint64_t) \
  307. ? "%llu\n" : \
  308. __builtin_types_compatible_p(typeof(var), const char *) \
  309. ? "%s\n" : "%i\n", var)
  310. ssize_t bch_hprint(char *buf, int64_t v);
  311. bool bch_is_zero(const char *p, size_t n);
  312. int bch_parse_uuid(const char *s, char *uuid);
  313. struct time_stats {
  314. spinlock_t lock;
  315. /*
  316. * all fields are in nanoseconds, averages are ewmas stored left shifted
  317. * by 8
  318. */
  319. uint64_t max_duration;
  320. uint64_t average_duration;
  321. uint64_t average_frequency;
  322. uint64_t last;
  323. };
  324. void bch_time_stats_update(struct time_stats *stats, uint64_t time);
  325. static inline unsigned int local_clock_us(void)
  326. {
  327. return local_clock() >> 10;
  328. }
  329. #define NSEC_PER_ns 1L
  330. #define NSEC_PER_us NSEC_PER_USEC
  331. #define NSEC_PER_ms NSEC_PER_MSEC
  332. #define NSEC_PER_sec NSEC_PER_SEC
  333. #define __print_time_stat(stats, name, stat, units) \
  334. sysfs_print(name ## _ ## stat ## _ ## units, \
  335. div_u64((stats)->stat >> 8, NSEC_PER_ ## units))
  336. #define sysfs_print_time_stats(stats, name, \
  337. frequency_units, \
  338. duration_units) \
  339. do { \
  340. __print_time_stat(stats, name, \
  341. average_frequency, frequency_units); \
  342. __print_time_stat(stats, name, \
  343. average_duration, duration_units); \
  344. sysfs_print(name ## _ ##max_duration ## _ ## duration_units, \
  345. div_u64((stats)->max_duration, \
  346. NSEC_PER_ ## duration_units)); \
  347. \
  348. sysfs_print(name ## _last_ ## frequency_units, (stats)->last \
  349. ? div_s64(local_clock() - (stats)->last, \
  350. NSEC_PER_ ## frequency_units) \
  351. : -1LL); \
  352. } while (0)
  353. #define sysfs_time_stats_attribute(name, \
  354. frequency_units, \
  355. duration_units) \
  356. read_attribute(name ## _average_frequency_ ## frequency_units); \
  357. read_attribute(name ## _average_duration_ ## duration_units); \
  358. read_attribute(name ## _max_duration_ ## duration_units); \
  359. read_attribute(name ## _last_ ## frequency_units)
  360. #define sysfs_time_stats_attribute_list(name, \
  361. frequency_units, \
  362. duration_units) \
  363. &sysfs_ ## name ## _average_frequency_ ## frequency_units, \
  364. &sysfs_ ## name ## _average_duration_ ## duration_units, \
  365. &sysfs_ ## name ## _max_duration_ ## duration_units, \
  366. &sysfs_ ## name ## _last_ ## frequency_units,
  367. #define ewma_add(ewma, val, weight, factor) \
  368. ({ \
  369. (ewma) *= (weight) - 1; \
  370. (ewma) += (val) << factor; \
  371. (ewma) /= (weight); \
  372. (ewma) >> factor; \
  373. })
  374. struct bch_ratelimit {
  375. /* Next time we want to do some work, in nanoseconds */
  376. uint64_t next;
  377. /*
  378. * Rate at which we want to do work, in units per second
  379. * The units here correspond to the units passed to bch_next_delay()
  380. */
  381. atomic_long_t rate;
  382. };
  383. static inline void bch_ratelimit_reset(struct bch_ratelimit *d)
  384. {
  385. d->next = local_clock();
  386. }
  387. uint64_t bch_next_delay(struct bch_ratelimit *d, uint64_t done);
  388. #define __DIV_SAFE(n, d, zero) \
  389. ({ \
  390. typeof(n) _n = (n); \
  391. typeof(d) _d = (d); \
  392. _d ? _n / _d : zero; \
  393. })
  394. #define DIV_SAFE(n, d) __DIV_SAFE(n, d, 0)
  395. #define container_of_or_null(ptr, type, member) \
  396. ({ \
  397. typeof(ptr) _ptr = ptr; \
  398. _ptr ? container_of(_ptr, type, member) : NULL; \
  399. })
  400. #define RB_INSERT(root, new, member, cmp) \
  401. ({ \
  402. __label__ dup; \
  403. struct rb_node **n = &(root)->rb_node, *parent = NULL; \
  404. typeof(new) this; \
  405. int res, ret = -1; \
  406. \
  407. while (*n) { \
  408. parent = *n; \
  409. this = container_of(*n, typeof(*(new)), member); \
  410. res = cmp(new, this); \
  411. if (!res) \
  412. goto dup; \
  413. n = res < 0 \
  414. ? &(*n)->rb_left \
  415. : &(*n)->rb_right; \
  416. } \
  417. \
  418. rb_link_node(&(new)->member, parent, n); \
  419. rb_insert_color(&(new)->member, root); \
  420. ret = 0; \
  421. dup: \
  422. ret; \
  423. })
  424. #define RB_SEARCH(root, search, member, cmp) \
  425. ({ \
  426. struct rb_node *n = (root)->rb_node; \
  427. typeof(&(search)) this, ret = NULL; \
  428. int res; \
  429. \
  430. while (n) { \
  431. this = container_of(n, typeof(search), member); \
  432. res = cmp(&(search), this); \
  433. if (!res) { \
  434. ret = this; \
  435. break; \
  436. } \
  437. n = res < 0 \
  438. ? n->rb_left \
  439. : n->rb_right; \
  440. } \
  441. ret; \
  442. })
  443. #define RB_GREATER(root, search, member, cmp) \
  444. ({ \
  445. struct rb_node *n = (root)->rb_node; \
  446. typeof(&(search)) this, ret = NULL; \
  447. int res; \
  448. \
  449. while (n) { \
  450. this = container_of(n, typeof(search), member); \
  451. res = cmp(&(search), this); \
  452. if (res < 0) { \
  453. ret = this; \
  454. n = n->rb_left; \
  455. } else \
  456. n = n->rb_right; \
  457. } \
  458. ret; \
  459. })
  460. #define RB_FIRST(root, type, member) \
  461. container_of_or_null(rb_first(root), type, member)
  462. #define RB_LAST(root, type, member) \
  463. container_of_or_null(rb_last(root), type, member)
  464. #define RB_NEXT(ptr, member) \
  465. container_of_or_null(rb_next(&(ptr)->member), typeof(*ptr), member)
  466. #define RB_PREV(ptr, member) \
  467. container_of_or_null(rb_prev(&(ptr)->member), typeof(*ptr), member)
  468. static inline uint64_t bch_crc64(const void *p, size_t len)
  469. {
  470. uint64_t crc = 0xffffffffffffffffULL;
  471. crc = crc64_be(crc, p, len);
  472. return crc ^ 0xffffffffffffffffULL;
  473. }
  474. static inline uint64_t bch_crc64_update(uint64_t crc,
  475. const void *p,
  476. size_t len)
  477. {
  478. crc = crc64_be(crc, p, len);
  479. return crc;
  480. }
  481. /*
  482. * A stepwise-linear pseudo-exponential. This returns 1 << (x >>
  483. * frac_bits), with the less-significant bits filled in by linear
  484. * interpolation.
  485. *
  486. * This can also be interpreted as a floating-point number format,
  487. * where the low frac_bits are the mantissa (with implicit leading
  488. * 1 bit), and the more significant bits are the exponent.
  489. * The return value is 1.mantissa * 2^exponent.
  490. *
  491. * The way this is used, fract_bits is 6 and the largest possible
  492. * input is CONGESTED_MAX-1 = 1023 (exponent 16, mantissa 0x1.fc),
  493. * so the maximum output is 0x1fc00.
  494. */
  495. static inline unsigned int fract_exp_two(unsigned int x,
  496. unsigned int fract_bits)
  497. {
  498. unsigned int mantissa = 1 << fract_bits; /* Implicit bit */
  499. mantissa += x & (mantissa - 1);
  500. x >>= fract_bits; /* The exponent */
  501. /* Largest intermediate value 0x7f0000 */
  502. return mantissa << x >> fract_bits;
  503. }
  504. void bch_bio_map(struct bio *bio, void *base);
  505. int bch_bio_alloc_pages(struct bio *bio, gfp_t gfp_mask);
  506. static inline sector_t bdev_sectors(struct block_device *bdev)
  507. {
  508. return bdev->bd_inode->i_size >> 9;
  509. }
  510. #endif /* _BCACHE_UTIL_H */