1 /* SPDX-License-Identifier: GPL-2.0 */
6 #include <linux/blkdev.h>
7 #include <linux/errno.h>
8 #include <linux/kernel.h>
9 #include <linux/sched/clock.h>
10 #include <linux/llist.h>
11 #include <linux/ratelimit.h>
12 #include <linux/vmalloc.h>
13 #include <linux/workqueue.h>
14 #include <linux/crc64.h>
/*
 * Debug-only assertion helpers. With CONFIG_BCACHE_DEBUG the three macros
 * forward to BUG_ON(): EBUG_ON() on the condition itself, atomic_dec_bug()
 * when the decremented counter goes negative, and atomic_inc_bug() when the
 * incremented counter is not above i.
 * NOTE(review): i is expanded unparenthesised in atomic_inc_bug().
 */
20 #ifdef CONFIG_BCACHE_DEBUG
22 #define EBUG_ON(cond) BUG_ON(cond)
23 #define atomic_dec_bug(v) BUG_ON(atomic_dec_return(v) < 0)
24 #define atomic_inc_bug(v, i) BUG_ON(atomic_inc_return(v) <= i)
/*
 * Non-checking forms: EBUG_ON() still evaluates cond but takes no action,
 * and the atomic helpers only perform the plain increment/decrement.
 * NOTE(review): the #else/#endif separating the two sets of definitions are
 * not visible in this listing.
 */
28 #define EBUG_ON(cond) do { if (cond) do {} while (0); } while (0)
29 #define atomic_dec_bug(v) atomic_dec(v)
30 #define atomic_inc_bug(v, i) atomic_inc(v)
/*
 * Declares a heap called name for elements of the given type.
 * NOTE(review): the macro body is not visible in this listing; the heap_*
 * macros access members named size, used and data - confirm the layout
 * against the full header.
 */
34 #define DECLARE_HEAP(type, name) \
/*
 * init_heap - set the capacity of a heap and allocate its element array.
 * Stores _size in heap->size and allocates size * sizeof(element) bytes with
 * kvmalloc(); the caller's gfp flags are masked with GFP_KERNEL first.
 * NOTE(review): the byte count is a plain multiplication with no overflow
 * check visible here; the rest of the macro (including its result
 * expression) is on lines missing from this listing.
 */
40 #define init_heap(heap, _size, gfp) \
44 (heap)->size = (_size); \
45 _bytes = (heap)->size * sizeof(*(heap)->data); \
46 (heap)->data = kvmalloc(_bytes, (gfp) & GFP_KERNEL); \
/*
 * free_heap - release the element array with kvfree() and clear the pointer
 * so that no stale reference to the freed memory remains in the heap.
 */
50 #define free_heap(heap) \
52 kvfree((heap)->data); \
53 (heap)->data = NULL; \
/* heap_swap - exchange elements i and j of the heap's data array. */
56 #define heap_swap(h, i, j) swap((h)->data[i], (h)->data[j])
/*
 * heap_sift - restore heap order starting at index i and moving towards the
 * leaves. The loop runs while slot _j still has a child
 * (_j * 2 + 1 < h->used); child _r is compared with its sibling _r + 1 and
 * with the parent _j through cmp(), and child and parent are exchanged with
 * heap_swap().
 * NOTE(review): the declarations of _r/_j and the bodies of both branches
 * are on lines missing from this listing, so the exact child-selection and
 * termination rules are not shown here.
 */
58 #define heap_sift(h, i, cmp) \
62 for (; _j * 2 + 1 < (h)->used; _j = _r) { \
64 if (_r + 1 < (h)->used && \
65 cmp((h)->data[_r], (h)->data[_r + 1])) \
68 if (cmp((h)->data[_r], (h)->data[_j])) \
70 heap_swap(h, _r, _j); \
/*
 * heap_sift_down - compare element i with its parent p = (i - 1) / 2 using
 * cmp().
 * NOTE(review): despite the name, the visible code looks at the parent of i,
 * not at its children. i is expanded unparenthesised, so pass a plain
 * variable. The loop structure and the swap are on lines missing from this
 * listing.
 */
74 #define heap_sift_down(h, i, cmp) \
77 size_t p = (i - 1) / 2; \
78 if (cmp((h)->data[i], (h)->data[p])) \
/*
 * heap_add - insert d into heap h, ordered by cmp.
 * _r records whether the heap had room (it was not heap_full()). A slot
 * index is claimed by post-incrementing h->used, after which the ordering is
 * repaired with heap_sift_down() followed by heap_sift() on that slot.
 * NOTE(review): the store of d and the macro's result expression are on
 * lines missing from this listing - presumably _r is the result; confirm.
 */
85 #define heap_add(h, d, cmp) \
87 bool _r = !heap_full(h); \
89 size_t _i = (h)->used++; \
92 heap_sift_down(h, _i, cmp); \
93 heap_sift(h, _i, cmp); \
/*
 * heap_pop - remove the root of heap h into d.
 * _r is true when the heap holds at least one element. The root data[0] is
 * copied to d, slot 0 is exchanged with slot h->used, and heap_sift()
 * re-establishes the ordering from the root.
 * NOTE(review): the adjustment of h->used between those steps and the
 * result expression are on lines missing from this listing.
 */
98 #define heap_pop(h, d, cmp) \
100 bool _r = (h)->used; \
102 (d) = (h)->data[0]; \
104 heap_swap(h, 0, (h)->used); \
105 heap_sift(h, 0, cmp); \
/*
 * heap_peek - root element without removing it, or NULL when the heap is
 * empty (the NULL arm assumes the element type is a pointer).
 */
110 #define heap_peek(h) ((h)->used ? (h)->data[0] : NULL)
/* heap_full - true once the number of used slots has reached the capacity. */
112 #define heap_full(h) ((h)->used == (h)->size)
/*
 * Declares a FIFO called name. The visible part of the layout is the four
 * size_t bookkeeping fields: front and back (ring indices), size (usable
 * capacity) and mask (index wrap mask).
 * NOTE(review): the data member used by the fifo_* macros is on a line
 * missing from this listing.
 */
114 #define DECLARE_FIFO(type, name) \
116 size_t front, back, size, mask; \
/*
 * fifo_for_each - visit every queued element, oldest first
 * @c:    lvalue that receives each element in turn
 * @fifo: pointer to the FIFO
 * @iter: integer lvalue used as the ring index
 *
 * Walks from fifo->front to fifo->back, wrapping with fifo->mask. The element
 * is loaded only after the index has been checked against fifo->back, so the
 * slot at back (which holds no queued element) is never read and @c is left
 * untouched when the FIFO is empty.
 */
#define fifo_for_each(c, fifo, iter)					\
	for ((iter) = (fifo)->front;					\
	     (iter) != (fifo)->back && ((c) = (fifo)->data[iter], 1);	\
	     (iter) = ((iter) + 1) & (fifo)->mask)
/*
 * __init_fifo - common FIFO set-up; fifo->size must already be set.
 * A zero size is a BUG. The ring gets size + 1 slots rounded up to a power
 * of two, so indices can be wrapped with "& mask" (mask is the slot count
 * minus one). front and back both start at 0. The array comes from
 * kvmalloc() with the caller's gfp flags masked by GFP_KERNEL.
 * NOTE(review): the byte count is an unchecked multiplication, and the
 * macro's result expression is on a line missing from this listing.
 */
125 #define __init_fifo(fifo, gfp) \
127 size_t _allocated_size, _bytes; \
128 BUG_ON(!(fifo)->size); \
130 _allocated_size = roundup_pow_of_two((fifo)->size + 1); \
131 _bytes = _allocated_size * sizeof(*(fifo)->data); \
133 (fifo)->mask = _allocated_size - 1; \
134 (fifo)->front = (fifo)->back = 0; \
136 (fifo)->data = kvmalloc(_bytes, (gfp) & GFP_KERNEL); \
/*
 * init_fifo_exact - initialise a FIFO whose usable capacity is exactly
 * _size: the value is stored in fifo->size unchanged and the rest of the
 * set-up is delegated to __init_fifo().
 */
140 #define init_fifo_exact(fifo, _size, gfp) \
142 (fifo)->size = (_size); \
143 __init_fifo(fifo, gfp); \
/*
 * init_fifo - initialise a FIFO with a capacity of at least _size.
 * For requests above 4 the capacity is raised to roundup_pow_of_two(size) - 1,
 * which makes size + 1 a power of two and therefore matches the slot count
 * that __init_fifo() allocates. Smaller requests are kept as given.
 */
146 #define init_fifo(fifo, _size, gfp) \
148 (fifo)->size = (_size); \
149 if ((fifo)->size > 4) \
150 (fifo)->size = roundup_pow_of_two((fifo)->size) - 1; \
151 __init_fifo(fifo, gfp); \
/*
 * free_fifo - release the ring buffer with kvfree() and clear the pointer so
 * that no stale reference to the freed memory remains in the FIFO.
 */
154 #define free_fifo(fifo) \
156 kvfree((fifo)->data); \
157 (fifo)->data = NULL; \
/* fifo_used - number of queued elements: (back - front) wrapped by mask. */
160 #define fifo_used(fifo) (((fifo)->back - (fifo)->front) & (fifo)->mask)
/* fifo_free - remaining room, measured against the usable capacity size. */
161 #define fifo_free(fifo) ((fifo)->size - fifo_used(fifo))
/* fifo_empty / fifo_full - no queued elements / no remaining room. */
163 #define fifo_empty(fifo) (!fifo_used(fifo))
164 #define fifo_full(fifo) (!fifo_free(fifo))
/* fifo_front - the slot at index front, as an lvalue. */
166 #define fifo_front(fifo) ((fifo)->data[(fifo)->front])
/* fifo_back - the slot just before index back, with wrap-around. */
167 #define fifo_back(fifo) \
168 ((fifo)->data[((fifo)->back - 1) & (fifo)->mask])
/* fifo_idx - offset of element pointer p from the front slot, wrapped. */
170 #define fifo_idx(fifo, p) (((p) - &fifo_front(fifo)) & (fifo)->mask)
/*
 * fifo_push_back - append i at the back of the FIFO.
 * _r records whether there was room (the FIFO was not fifo_full()). The
 * value is stored in the slot at back, and back is then advanced and wrapped
 * with mask.
 * NOTE(review): the guard around the store and the result expression are on
 * lines missing from this listing - presumably the store only happens when
 * _r is true and _r is the result; confirm.
 */
172 #define fifo_push_back(fifo, i) \
174 bool _r = !fifo_full((fifo)); \
176 (fifo)->data[(fifo)->back++] = (i); \
177 (fifo)->back &= (fifo)->mask; \
/*
 * fifo_pop_front - remove the element at the front of the FIFO into i.
 * _r records whether the FIFO held anything (it was not fifo_empty()). The
 * slot at front is copied to i, and front is then advanced and wrapped with
 * mask.
 * NOTE(review): the guard around the load and the result expression are on
 * lines missing from this listing - presumably the load only happens when
 * _r is true and _r is the result; confirm.
 */
182 #define fifo_pop_front(fifo, i) \
184 bool _r = !fifo_empty((fifo)); \
186 (i) = (fifo)->data[(fifo)->front++]; \
187 (fifo)->front &= (fifo)->mask; \
/*
 * fifo_push_front - insert i at the front of the FIFO.
 * _r records whether there was room (the FIFO was not fifo_full()). front is
 * wrapped with mask and i is stored in the slot it then names.
 * NOTE(review): the statement that moves front before it is wrapped, the
 * guard and the result expression are on lines missing from this listing.
 */
192 #define fifo_push_front(fifo, i) \
194 bool _r = !fifo_full((fifo)); \
197 (fifo)->front &= (fifo)->mask; \
198 (fifo)->data[(fifo)->front] = (i); \
/*
 * fifo_pop_back - remove the newest element from the back of the FIFO
 * @fifo: pointer to the FIFO
 * @i:    lvalue that receives the removed element
 *
 * Evaluates to true if an element was removed and to false if the FIFO was
 * empty, in which case @i is left untouched. back always names the slot
 * after the newest element, so it is stepped back by one and wrapped with
 * fifo->mask before the element is read.
 */
#define fifo_pop_back(fifo, i)						\
({									\
	bool _r = !fifo_empty((fifo));					\
	if (_r) {							\
		--(fifo)->back;						\
		(fifo)->back &= (fifo)->mask;				\
		(i) = (fifo)->data[(fifo)->back];			\
	}								\
	_r;								\
})
/*
 * Default queue operations: fifo_push() appends at the back and fifo_pop()
 * removes from the front.
 */
214 #define fifo_push(fifo, i) fifo_push_back(fifo, (i))
215 #define fifo_pop(fifo, i) fifo_pop_front(fifo, (i))
/*
 * fifo_swap - exchange the complete state of two FIFOs (both indices, the
 * capacity, the mask and the data pointer). Only the bookkeeping fields are
 * swapped; no element is copied.
 */
217 #define fifo_swap(l, r) \
219 swap((l)->front, (r)->front); \
220 swap((l)->back, (r)->back); \
221 swap((l)->size, (r)->size); \
222 swap((l)->mask, (r)->mask); \
223 swap((l)->data, (r)->data); \
/*
 * fifo_move - transfer elements into dest for as long as dest has room.
 * Each element passes through the temporary _t (typed like dest's elements)
 * and is appended with fifo_push().
 * NOTE(review): the second half of the loop condition is on a line missing
 * from this listing - presumably it pops the next element from src into _t
 * and stops when src is empty; confirm.
 */
226 #define fifo_move(dest, src) \
228 typeof(*((dest)->data)) _t; \
229 while (!fifo_full(dest) && \
231 fifo_push(dest, _t); \
235 * Simple array based allocator - preallocates a number of elements and you can
236 * never allocate more than that, also has no locking.
238 * Handy because if you know you only need a fixed number of elements you don't
239 * have to worry about memory allocation failure, and sometimes a mempool isn't
242 * We treat the free elements as entries in a singly linked list, and the
243 * freelist as a stack - allocating and freeing push and pop off the freelist.
/*
 * Declares an array allocator called name for the given element type and
 * element count.
 * NOTE(review): the macro body is not visible in this listing; the array_*
 * macros access members named freelist and data - confirm the layout
 * against the full header.
 */
246 #define DECLARE_ARRAY_ALLOCATOR(type, name, size) \
/*
 * array_alloc - take the element at the head of the free list.
 * _ret is the current head; the new head is the link pointer stored at the
 * start of that element.
 * NOTE(review): the guard for an empty free list and the result expression
 * are on lines missing from this listing.
 */
252 #define array_alloc(array) \
254 typeof((array)->freelist) _ret = (array)->freelist; \
257 (array)->freelist = *((typeof((array)->freelist) *) _ret);\
/*
 * array_free - hand ptr back to the allocator.
 * The previous list head is written into the start of the element itself,
 * and the element then becomes the new head of the free list.
 */
262 #define array_free(array, ptr) \
264 typeof((array)->freelist) _ptr = ptr; \
266 *((typeof((array)->freelist) *) _ptr) = (array)->freelist; \
267 (array)->freelist = _ptr; \
/*
 * array_allocator_init - build the initial free list.
 * Starts from an empty list and pushes every element of array->data with
 * array_free(). The BUILD_BUG_ON rejects element types smaller than a
 * pointer, because each free element stores the list link inside itself.
 * NOTE(review): the loop's increment expression is on a line missing from
 * this listing.
 */
270 #define array_allocator_init(array) \
272 typeof((array)->freelist) _i; \
274 BUILD_BUG_ON(sizeof((array)->data[0]) < sizeof(void *)); \
275 (array)->freelist = NULL; \
277 for (_i = (array)->data; \
278 _i < (array)->data + ARRAY_SIZE((array)->data); \
280 array_free(array, _i); \
/* array_freelist_empty - true when no free element is left to allocate. */
283 #define array_freelist_empty(array) ((array)->freelist == NULL)
/*
 * ANYSINT_MAX - largest value of signed integer type t.
 * Computed as (2^(bits - 2) - 1) * 2 + 1, which equals 2^(bits - 1) - 1
 * while every intermediate value stays representable in t.
 */
285 #define ANYSINT_MAX(t) \
286 ((((t) 1 << (sizeof(t) * 8 - 2)) - (t) 1) * (t) 2 + (t) 1)
/*
 * String-to-integer parsers, one per result type, implemented outside this
 * header. Each takes the input string cp and a pointer res for the result
 * and returns an int status.
 * NOTE(review): presumably 0 on success / negative errno on failure, and the
 * _h suffix presumably means human-readable unit suffixes are accepted -
 * confirm against the implementation.
 */
288 int bch_strtoint_h(const char *cp, int *res);
289 int bch_strtouint_h(const char *cp, unsigned int *res);
290 int bch_strtoll_h(const char *cp, long long *res);
291 int bch_strtoull_h(const char *cp, unsigned long long *res);
/*
 * bch_strtol_h - long flavour of the bch_strto*_h() parsers.
 * Reuses the parser for the integer type that has the same width as long,
 * handing it res through a pointer cast, and returns that parser's status.
 * NOTE(review): the braces and the #else/#endif that separate the two
 * return statements are not visible in this listing.
 */
293 static inline int bch_strtol_h(const char *cp, long *res)
295 #if BITS_PER_LONG == 32
/* long is 32 bits wide here: use the int parser. */
296 return bch_strtoint_h(cp, (int *) res);
/* Any other width: use the long long parser. */
298 return bch_strtoll_h(cp, (long long *) res);
/*
 * bch_strtoul_h - unsigned long flavour of the bch_strto*_h() parsers.
 * Reuses the unsigned parser for the integer type that has the same width as
 * long, handing it res through a pointer cast, and returns that parser's
 * status.
 * NOTE(review): res is declared as "long *" although the value is parsed as
 * unsigned; "unsigned long *" looks like the intended type - confirm with
 * the callers before changing the signature. The braces and the
 * #else/#endif that separate the two return statements are not visible in
 * this listing.
 */
302 static inline int bch_strtoul_h(const char *cp, long *res)
304 #if BITS_PER_LONG == 32
/* long is 32 bits wide here: use the unsigned int parser. */
305 return bch_strtouint_h(cp, (unsigned int *) res);
/* Any other width: use the unsigned long long parser. */
307 return bch_strtoull_h(cp, (unsigned long long *) res);
/*
 * strtoi_h - parse a string into whatever integer type @res points to
 * @cp:  string to parse
 * @res: pointer to the destination; its pointee type selects the parser
 *
 * Dispatches at compile time on typeof(*(res)) to the bch_strto*_h() helper
 * for int, long, long long and their unsigned counterparts, and evaluates to
 * that helper's return value. Any other pointee type evaluates to -EINVAL.
 *
 * Every arm of the conditional chain is compiled regardless of which one is
 * selected, so @res is passed through a void * cast to keep the arms that do
 * not match its type well-formed. Both arguments are parenthesised so that
 * expressions such as "ptr + 1" expand correctly.
 */
#define strtoi_h(cp, res)						\
	(__builtin_types_compatible_p(typeof(*(res)), int)		\
	 ? bch_strtoint_h((cp), (void *) (res))				\
	 : __builtin_types_compatible_p(typeof(*(res)), long)		\
	 ? bch_strtol_h((cp), (void *) (res))				\
	 : __builtin_types_compatible_p(typeof(*(res)), long long)	\
	 ? bch_strtoll_h((cp), (void *) (res))				\
	 : __builtin_types_compatible_p(typeof(*(res)), unsigned int)	\
	 ? bch_strtouint_h((cp), (void *) (res))			\
	 : __builtin_types_compatible_p(typeof(*(res)), unsigned long)	\
	 ? bch_strtoul_h((cp), (void *) (res))				\
	 : __builtin_types_compatible_p(typeof(*(res)), unsigned long long)\
	 ? bch_strtoull_h((cp), (void *) (res)) : -EINVAL)
/*
 * strtoul_safe - parse cp as a base-10 unsigned long with kstrtoul().
 * The parsed value lands in the temporary _v and kstrtoul()'s status in _r.
 * NOTE(review): the declaration of _v, the assignment to var and the result
 * expression are on lines missing from this listing - presumably var is only
 * written on success and _r is the result; confirm.
 */
325 #define strtoul_safe(cp, var) \
328 int _r = kstrtoul(cp, 10, &_v); \
/*
 * strtoul_safe_clamp - like strtoul_safe(), but the value stored in var is
 * limited to the range [min, max]. The clamp is evaluated in var's own type
 * via clamp_t(typeof(var), ...).
 * NOTE(review): the declaration of _v, any guard on _r around the
 * assignment and the result expression are on lines missing from this
 * listing.
 */
334 #define strtoul_safe_clamp(cp, var, min, max) \
337 int _r = kstrtoul(cp, 10, &_v); \
339 var = clamp_t(typeof(var), _v, min, max); \
/*
 * Helpers implemented outside this header; only their signatures are
 * visible here.
 * NOTE(review): judging by the names, bch_hprint() formats v into buf in
 * human-readable form, bch_is_zero() tests whether the n bytes at p are all
 * zero, and bch_parse_uuid() converts the text s into the binary uuid -
 * confirm against the implementation.
 */
343 ssize_t bch_hprint(char *buf, int64_t v);
345 bool bch_is_zero(const char *p, size_t n);
346 int bch_parse_uuid(const char *s, char *uuid);
351 * all fields are in nanoseconds, averages are ewmas stored left shifted
/* Printed by sysfs_print_time_stats() without any shift applied. */
354 uint64_t max_duration;
/*
 * The two averages are shifted right by 8 by __print_time_stat() before
 * being converted to the display unit.
 */
355 uint64_t average_duration;
356 uint64_t average_frequency;
/*
 * Implemented outside this header.
 * NOTE(review): presumably folds one more sample into stats, with time being
 * a clock value related to the event - confirm the exact meaning of time
 * against the implementation.
 */
360 void bch_time_stats_update(struct time_stats *stats, uint64_t time);
/*
 * local_clock_us - cheap approximation of the local clock in microseconds.
 * Shifts local_clock() right by 10, i.e. divides by 1024 rather than 1000,
 * and truncates the result to unsigned int, so the value is slightly low and
 * wraps around.
 * NOTE(review): assumes local_clock() counts nanoseconds - confirm.
 */
362 static inline unsigned int local_clock_us(void)
364 return local_clock() >> 10;
/*
 * Lower-case unit aliases, so that a unit token (ns, us, ms, sec) given to
 * the time-stats macros can be pasted onto "NSEC_PER_" to obtain the divisor
 * for that unit.
 */
367 #define NSEC_PER_ns 1L
368 #define NSEC_PER_us NSEC_PER_USEC
369 #define NSEC_PER_ms NSEC_PER_MSEC
370 #define NSEC_PER_sec NSEC_PER_SEC
/*
 * __print_time_stat - emit one averaged statistic through sysfs_print().
 * The attribute name is built as <name>_<stat>_<units>. The stored value is
 * shifted right by 8 and then divided by NSEC_PER_<units> to convert it to
 * the requested unit.
 */
372 #define __print_time_stat(stats, name, stat, units) \
373 sysfs_print(name ## _ ## stat ## _ ## units, \
374 div_u64((stats)->stat >> 8, NSEC_PER_ ## units))
/*
 * sysfs_print_time_stats - emit the four sysfs values of one time_stats:
 *  - average frequency and average duration, via __print_time_stat();
 *  - max_duration, divided by NSEC_PER_<duration_units>;
 *  - <name>_last_<frequency_units>: the time elapsed since stats->last,
 *    divided by NSEC_PER_<frequency_units>, computed only when stats->last
 *    is non-zero.
 * NOTE(review): the remaining macro parameters, the value used when
 * stats->last is zero and the enclosing statement wrapper are on lines
 * missing from this listing.
 */
376 #define sysfs_print_time_stats(stats, name, \
380 __print_time_stat(stats, name, \
381 average_frequency, frequency_units); \
382 __print_time_stat(stats, name, \
383 average_duration, duration_units); \
384 sysfs_print(name ## _ ##max_duration ## _ ## duration_units, \
385 div_u64((stats)->max_duration, \
386 NSEC_PER_ ## duration_units)); \
388 sysfs_print(name ## _last_ ## frequency_units, (stats)->last \
389 ? div_s64(local_clock() - (stats)->last, \
390 NSEC_PER_ ## frequency_units) \
/*
 * sysfs_time_stats_attribute - declare, via read_attribute(), the four
 * attributes that sysfs_print_time_stats() fills in for name: average
 * frequency, average duration, max duration and time since last.
 * NOTE(review): the remaining macro parameters are on lines missing from
 * this listing.
 */
394 #define sysfs_time_stats_attribute(name, \
397 read_attribute(name ## _average_frequency_ ## frequency_units); \
398 read_attribute(name ## _average_duration_ ## duration_units); \
399 read_attribute(name ## _max_duration_ ## duration_units); \
400 read_attribute(name ## _last_ ## frequency_units)
/*
 * sysfs_time_stats_attribute_list - expands to the addresses of the four
 * sysfs_<name>_* attribute objects, each followed by a comma, so the macro
 * can be dropped into an initialiser list.
 * NOTE(review): the remaining macro parameters are on lines missing from
 * this listing.
 */
402 #define sysfs_time_stats_attribute_list(name, \
405 &sysfs_ ## name ## _average_frequency_ ## frequency_units, \
406 &sysfs_ ## name ## _average_duration_ ## duration_units, \
407 &sysfs_ ## name ## _max_duration_ ## duration_units, \
408 &sysfs_ ## name ## _last_ ## frequency_units,
/*
 * ewma_add - fold val into the running average ewma, in place.
 * Computes ewma = (ewma * (weight - 1) + (val << factor)) / weight, so the
 * average is kept left-shifted by factor bits.
 * NOTE(review): factor is expanded unparenthesised, so pass a simple
 * constant or variable. The statement wrapper and any result expression are
 * on lines missing from this listing.
 */
410 #define ewma_add(ewma, val, weight, factor) \
412 (ewma) *= (weight) - 1; \
413 (ewma) += (val) << factor; \
414 (ewma) /= (weight); \
/*
 * State of one rate limiter.
 * NOTE(review): the member declarations are on lines missing from this
 * listing; bch_ratelimit_reset() writes a member called next, which the
 * first comment below describes.
 */
418 struct bch_ratelimit {
419 /* Next time we want to do some work, in nanoseconds */
423 * Rate at which we want to do work, in units per second
424 * The units here correspond to the units passed to bch_next_delay()
/*
 * bch_ratelimit_reset - restart the limiter from the present moment by
 * setting d->next to the current local_clock() value.
 */
429 static inline void bch_ratelimit_reset(struct bch_ratelimit *d)
431 d->next = local_clock();
/*
 * Implemented outside this header.
 * NOTE(review): presumably accounts for done units of work against d and
 * returns how long the caller should wait before doing more - confirm the
 * unit of the return value against the implementation.
 */
434 uint64_t bch_next_delay(struct bch_ratelimit *d, uint64_t done);
/*
 * __DIV_SAFE - n / d, or the fallback value zero when d is 0.
 * n and d are each evaluated once into typed temporaries.
 * DIV_SAFE is the common case with a fallback of 0.
 * NOTE(review): zero is expanded unparenthesised, and the lines that open
 * and close the macro body are missing from this listing.
 */
436 #define __DIV_SAFE(n, d, zero) \
438 typeof(n) _n = (n); \
439 typeof(d) _d = (d); \
440 _d ? _n / _d : zero; \
443 #define DIV_SAFE(n, d) __DIV_SAFE(n, d, 0)
/*
 * container_of_or_null - container_of() that tolerates a NULL member
 * pointer: ptr is evaluated once, and a NULL ptr yields NULL instead of
 * being converted to a bogus container address.
 */
445 #define container_of_or_null(ptr, type, member) \
447 typeof(ptr) _ptr = ptr; \
448 _ptr ? container_of(_ptr, type, member) : NULL; \
/*
 * RB_INSERT - insert new into the rb-tree at root, ordered by cmp().
 * new is a pointer to the containing object and member names its embedded
 * rb_node. The descent starts at the root link n and tracks parent; each
 * visited node is converted back to its container and compared with
 * cmp(new, this). The node is finally linked with rb_link_node() and the
 * tree rebalanced with rb_insert_color().
 * NOTE(review): the descent loop, the handling of cmp()'s result (including
 * what happens for an equal key) and the macro's result expression are on
 * lines missing from this listing.
 */
451 #define RB_INSERT(root, new, member, cmp) \
454 struct rb_node **n = &(root)->rb_node, *parent = NULL; \
460 this = container_of(*n, typeof(*(new)), member); \
461 res = cmp(new, this); \
469 rb_link_node(&(new)->member, parent, n); \
470 rb_insert_color(&(new)->member, root); \
/*
 * RB_SEARCH - look up search in the rb-tree at root using cmp().
 * search is an object, not a pointer: its address is passed to cmp()
 * together with the container of each visited node, and the result pointer
 * ret has type typeof(&search) and starts out NULL.
 * NOTE(review): the descent loop, the handling of cmp()'s result and the
 * result expression are on lines missing from this listing - presumably ret
 * is the matching node or NULL; confirm.
 */
476 #define RB_SEARCH(root, search, member, cmp) \
478 struct rb_node *n = (root)->rb_node; \
479 typeof(&(search)) this, ret = NULL; \
483 this = container_of(n, typeof(search), member); \
484 res = cmp(&(search), this); \
/*
 * RB_GREATER - walk the rb-tree at root comparing search against each
 * visited node with cmp().
 * search is an object, not a pointer: its address is passed to cmp()
 * together with the container of each visited node, and the result pointer
 * ret has type typeof(&search) and starts out NULL.
 * NOTE(review): the descent loop, the handling of cmp()'s result and the
 * result expression are on lines missing from this listing - judging by the
 * name, ret is presumably the first node ordered after search; confirm.
 */
496 #define RB_GREATER(root, search, member, cmp) \
498 struct rb_node *n = (root)->rb_node; \
499 typeof(&(search)) this, ret = NULL; \
503 this = container_of(n, typeof(search), member); \
504 res = cmp(&(search), this); \
/*
 * Typed wrappers around rb_first() / rb_last(): the container of the first
 * or last node of the tree, or NULL when rb_first()/rb_last() returns NULL.
 */
514 #define RB_FIRST(root, type, member) \
515 container_of_or_null(rb_first(root), type, member)
517 #define RB_LAST(root, type, member) \
518 container_of_or_null(rb_last(root), type, member)
/*
 * Typed wrappers around rb_next() / rb_prev(): the container of the node
 * after or before ptr, with the same type as *ptr, or NULL when there is no
 * such node.
 */
520 #define RB_NEXT(ptr, member) \
521 container_of_or_null(rb_next(&(ptr)->member), typeof(*ptr), member)
523 #define RB_PREV(ptr, member) \
524 container_of_or_null(rb_prev(&(ptr)->member), typeof(*ptr), member)
/*
 * bch_crc64 - checksum of the len bytes at p.
 * Seeds crc64_be() with all ones and inverts every bit of its result before
 * returning it.
 */
526 static inline uint64_t bch_crc64(const void *p, size_t len)
528 uint64_t crc = 0xffffffffffffffffULL;
530 crc = crc64_be(crc, p, len);
531 return crc ^ 0xffffffffffffffffULL;
/*
 * A stepwise-linear pseudo-exponential.  This returns 1 << (x >>
 * fract_bits), with the less-significant bits filled in by linear
 * interpolation.
 *
 * This can also be interpreted as a floating-point number format,
 * where the low fract_bits are the mantissa (with implicit leading
 * 1 bit), and the more significant bits are the exponent.
 * The return value is 1.mantissa * 2^exponent.
 *
 * The way this is used, fract_bits is 6 and the largest possible
 * input is CONGESTED_MAX-1 = 1023 (exponent 15, mantissa 0x1.fc),
 * so the maximum output is 0xfe00.
 *
 * The caller must keep x >> fract_bits small enough that the left
 * shift below still fits in an unsigned int.
 */
static inline unsigned int fract_exp_two(unsigned int x,
					 unsigned int fract_bits)
{
	unsigned int mantissa = 1U << fract_bits;	/* Implicit bit */

	mantissa += x & (mantissa - 1);
	x >>= fract_bits;				/* The exponent */
	/* Largest intermediate value 0x3f8000 */
	return mantissa << x >> fract_bits;
}
/*
 * bio helpers implemented outside this header; only their signatures are
 * visible here.
 * NOTE(review): judging by the names, bch_bio_map() points the bio's
 * segments at the buffer starting at base, and bch_bio_alloc_pages()
 * allocates pages for the bio with gfp_mask and returns an int status -
 * confirm against the implementation.
 */
559 void bch_bio_map(struct bio *bio, void *base);
560 int bch_bio_alloc_pages(struct bio *bio, gfp_t gfp_mask);
562 #endif /* _BCACHE_UTIL_H */