ptr_ring.h 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487
  1. /*
  2. * Definitions for the 'struct ptr_ring' datastructure.
  3. *
  4. * Author:
  5. * Michael S. Tsirkin <mst@redhat.com>
  6. *
  7. * Copyright (C) 2016 Red Hat, Inc.
  8. *
  9. * This program is free software; you can redistribute it and/or modify it
  10. * under the terms of the GNU General Public License as published by the
  11. * Free Software Foundation; either version 2 of the License, or (at your
  12. * option) any later version.
  13. *
  14. * This is a limited-size FIFO maintaining pointers in FIFO order, with
  15. * one CPU producing entries and another consuming entries from a FIFO.
  16. *
  17. * This implementation tries to minimize cache-contention when there is a
  18. * single producer and a single consumer CPU.
  19. */
  20. #ifndef _LINUX_PTR_RING_H
  21. #define _LINUX_PTR_RING_H 1
  22. #ifdef __KERNEL__
  23. #include <linux/spinlock.h>
  24. #include <linux/cache.h>
  25. #include <linux/types.h>
  26. #include <linux/compiler.h>
  27. #include <linux/cache.h>
  28. #include <linux/slab.h>
  29. #include <asm/errno.h>
  30. #endif
  31. struct ptr_ring {
  32. int producer ____cacheline_aligned_in_smp;
  33. spinlock_t producer_lock;
  34. int consumer ____cacheline_aligned_in_smp;
  35. spinlock_t consumer_lock;
  36. /* Shared consumer/producer data */
  37. /* Read-only by both the producer and the consumer */
  38. int size ____cacheline_aligned_in_smp; /* max entries in queue */
  39. void **queue;
  40. };
  41. /* Note: callers invoking this in a loop must use a compiler barrier,
  42. * for example cpu_relax(). If ring is ever resized, callers must hold
  43. * producer_lock - see e.g. ptr_ring_full. Otherwise, if callers don't hold
  44. * producer_lock, the next call to __ptr_ring_produce may fail.
  45. */
  46. static inline bool __ptr_ring_full(struct ptr_ring *r)
  47. {
  48. return r->queue[r->producer];
  49. }
  50. static inline bool ptr_ring_full(struct ptr_ring *r)
  51. {
  52. bool ret;
  53. spin_lock(&r->producer_lock);
  54. ret = __ptr_ring_full(r);
  55. spin_unlock(&r->producer_lock);
  56. return ret;
  57. }
  58. static inline bool ptr_ring_full_irq(struct ptr_ring *r)
  59. {
  60. bool ret;
  61. spin_lock_irq(&r->producer_lock);
  62. ret = __ptr_ring_full(r);
  63. spin_unlock_irq(&r->producer_lock);
  64. return ret;
  65. }
  66. static inline bool ptr_ring_full_any(struct ptr_ring *r)
  67. {
  68. unsigned long flags;
  69. bool ret;
  70. spin_lock_irqsave(&r->producer_lock, flags);
  71. ret = __ptr_ring_full(r);
  72. spin_unlock_irqrestore(&r->producer_lock, flags);
  73. return ret;
  74. }
  75. static inline bool ptr_ring_full_bh(struct ptr_ring *r)
  76. {
  77. bool ret;
  78. spin_lock_bh(&r->producer_lock);
  79. ret = __ptr_ring_full(r);
  80. spin_unlock_bh(&r->producer_lock);
  81. return ret;
  82. }
  83. /* Note: callers invoking this in a loop must use a compiler barrier,
  84. * for example cpu_relax(). Callers must hold producer_lock.
  85. * Callers are responsible for making sure pointer that is being queued
  86. * points to a valid data.
  87. */
  88. static inline int __ptr_ring_produce(struct ptr_ring *r, void *ptr)
  89. {
  90. if (unlikely(!r->size) || r->queue[r->producer])
  91. return -ENOSPC;
  92. /* Make sure the pointer we are storing points to a valid data. */
  93. /* Pairs with smp_read_barrier_depends in __ptr_ring_consume. */
  94. smp_wmb();
  95. r->queue[r->producer++] = ptr;
  96. if (unlikely(r->producer >= r->size))
  97. r->producer = 0;
  98. return 0;
  99. }
  100. /*
  101. * Note: resize (below) nests producer lock within consumer lock, so if you
  102. * consume in interrupt or BH context, you must disable interrupts/BH when
  103. * calling this.
  104. */
  105. static inline int ptr_ring_produce(struct ptr_ring *r, void *ptr)
  106. {
  107. int ret;
  108. spin_lock(&r->producer_lock);
  109. ret = __ptr_ring_produce(r, ptr);
  110. spin_unlock(&r->producer_lock);
  111. return ret;
  112. }
  113. static inline int ptr_ring_produce_irq(struct ptr_ring *r, void *ptr)
  114. {
  115. int ret;
  116. spin_lock_irq(&r->producer_lock);
  117. ret = __ptr_ring_produce(r, ptr);
  118. spin_unlock_irq(&r->producer_lock);
  119. return ret;
  120. }
  121. static inline int ptr_ring_produce_any(struct ptr_ring *r, void *ptr)
  122. {
  123. unsigned long flags;
  124. int ret;
  125. spin_lock_irqsave(&r->producer_lock, flags);
  126. ret = __ptr_ring_produce(r, ptr);
  127. spin_unlock_irqrestore(&r->producer_lock, flags);
  128. return ret;
  129. }
  130. static inline int ptr_ring_produce_bh(struct ptr_ring *r, void *ptr)
  131. {
  132. int ret;
  133. spin_lock_bh(&r->producer_lock);
  134. ret = __ptr_ring_produce(r, ptr);
  135. spin_unlock_bh(&r->producer_lock);
  136. return ret;
  137. }
  138. /* Note: callers invoking this in a loop must use a compiler barrier,
  139. * for example cpu_relax(). Callers must take consumer_lock
  140. * if they dereference the pointer - see e.g. PTR_RING_PEEK_CALL.
  141. * If ring is never resized, and if the pointer is merely
  142. * tested, there's no need to take the lock - see e.g. __ptr_ring_empty.
  143. */
  144. static inline void *__ptr_ring_peek(struct ptr_ring *r)
  145. {
  146. if (likely(r->size))
  147. return r->queue[r->consumer];
  148. return NULL;
  149. }
  150. /* Note: callers invoking this in a loop must use a compiler barrier,
  151. * for example cpu_relax(). Callers must take consumer_lock
  152. * if the ring is ever resized - see e.g. ptr_ring_empty.
  153. */
  154. static inline bool __ptr_ring_empty(struct ptr_ring *r)
  155. {
  156. return !__ptr_ring_peek(r);
  157. }
  158. static inline bool ptr_ring_empty(struct ptr_ring *r)
  159. {
  160. bool ret;
  161. spin_lock(&r->consumer_lock);
  162. ret = __ptr_ring_empty(r);
  163. spin_unlock(&r->consumer_lock);
  164. return ret;
  165. }
  166. static inline bool ptr_ring_empty_irq(struct ptr_ring *r)
  167. {
  168. bool ret;
  169. spin_lock_irq(&r->consumer_lock);
  170. ret = __ptr_ring_empty(r);
  171. spin_unlock_irq(&r->consumer_lock);
  172. return ret;
  173. }
  174. static inline bool ptr_ring_empty_any(struct ptr_ring *r)
  175. {
  176. unsigned long flags;
  177. bool ret;
  178. spin_lock_irqsave(&r->consumer_lock, flags);
  179. ret = __ptr_ring_empty(r);
  180. spin_unlock_irqrestore(&r->consumer_lock, flags);
  181. return ret;
  182. }
  183. static inline bool ptr_ring_empty_bh(struct ptr_ring *r)
  184. {
  185. bool ret;
  186. spin_lock_bh(&r->consumer_lock);
  187. ret = __ptr_ring_empty(r);
  188. spin_unlock_bh(&r->consumer_lock);
  189. return ret;
  190. }
  191. /* Must only be called after __ptr_ring_peek returned !NULL */
  192. static inline void __ptr_ring_discard_one(struct ptr_ring *r)
  193. {
  194. r->queue[r->consumer++] = NULL;
  195. if (unlikely(r->consumer >= r->size))
  196. r->consumer = 0;
  197. }
  198. static inline void *__ptr_ring_consume(struct ptr_ring *r)
  199. {
  200. void *ptr;
  201. ptr = __ptr_ring_peek(r);
  202. if (ptr)
  203. __ptr_ring_discard_one(r);
  204. /* Make sure anyone accessing data through the pointer is up to date. */
  205. /* Pairs with smp_wmb in __ptr_ring_produce. */
  206. smp_read_barrier_depends();
  207. return ptr;
  208. }
  209. /*
  210. * Note: resize (below) nests producer lock within consumer lock, so if you
  211. * call this in interrupt or BH context, you must disable interrupts/BH when
  212. * producing.
  213. */
  214. static inline void *ptr_ring_consume(struct ptr_ring *r)
  215. {
  216. void *ptr;
  217. spin_lock(&r->consumer_lock);
  218. ptr = __ptr_ring_consume(r);
  219. spin_unlock(&r->consumer_lock);
  220. return ptr;
  221. }
  222. static inline void *ptr_ring_consume_irq(struct ptr_ring *r)
  223. {
  224. void *ptr;
  225. spin_lock_irq(&r->consumer_lock);
  226. ptr = __ptr_ring_consume(r);
  227. spin_unlock_irq(&r->consumer_lock);
  228. return ptr;
  229. }
  230. static inline void *ptr_ring_consume_any(struct ptr_ring *r)
  231. {
  232. unsigned long flags;
  233. void *ptr;
  234. spin_lock_irqsave(&r->consumer_lock, flags);
  235. ptr = __ptr_ring_consume(r);
  236. spin_unlock_irqrestore(&r->consumer_lock, flags);
  237. return ptr;
  238. }
  239. static inline void *ptr_ring_consume_bh(struct ptr_ring *r)
  240. {
  241. void *ptr;
  242. spin_lock_bh(&r->consumer_lock);
  243. ptr = __ptr_ring_consume(r);
  244. spin_unlock_bh(&r->consumer_lock);
  245. return ptr;
  246. }
  247. /* Cast to structure type and call a function without discarding from FIFO.
  248. * Function must return a value.
  249. * Callers must take consumer_lock.
  250. */
  251. #define __PTR_RING_PEEK_CALL(r, f) ((f)(__ptr_ring_peek(r)))
  252. #define PTR_RING_PEEK_CALL(r, f) ({ \
  253. typeof((f)(NULL)) __PTR_RING_PEEK_CALL_v; \
  254. \
  255. spin_lock(&(r)->consumer_lock); \
  256. __PTR_RING_PEEK_CALL_v = __PTR_RING_PEEK_CALL(r, f); \
  257. spin_unlock(&(r)->consumer_lock); \
  258. __PTR_RING_PEEK_CALL_v; \
  259. })
  260. #define PTR_RING_PEEK_CALL_IRQ(r, f) ({ \
  261. typeof((f)(NULL)) __PTR_RING_PEEK_CALL_v; \
  262. \
  263. spin_lock_irq(&(r)->consumer_lock); \
  264. __PTR_RING_PEEK_CALL_v = __PTR_RING_PEEK_CALL(r, f); \
  265. spin_unlock_irq(&(r)->consumer_lock); \
  266. __PTR_RING_PEEK_CALL_v; \
  267. })
  268. #define PTR_RING_PEEK_CALL_BH(r, f) ({ \
  269. typeof((f)(NULL)) __PTR_RING_PEEK_CALL_v; \
  270. \
  271. spin_lock_bh(&(r)->consumer_lock); \
  272. __PTR_RING_PEEK_CALL_v = __PTR_RING_PEEK_CALL(r, f); \
  273. spin_unlock_bh(&(r)->consumer_lock); \
  274. __PTR_RING_PEEK_CALL_v; \
  275. })
  276. #define PTR_RING_PEEK_CALL_ANY(r, f) ({ \
  277. typeof((f)(NULL)) __PTR_RING_PEEK_CALL_v; \
  278. unsigned long __PTR_RING_PEEK_CALL_f;\
  279. \
  280. spin_lock_irqsave(&(r)->consumer_lock, __PTR_RING_PEEK_CALL_f); \
  281. __PTR_RING_PEEK_CALL_v = __PTR_RING_PEEK_CALL(r, f); \
  282. spin_unlock_irqrestore(&(r)->consumer_lock, __PTR_RING_PEEK_CALL_f); \
  283. __PTR_RING_PEEK_CALL_v; \
  284. })
  285. static inline void **__ptr_ring_init_queue_alloc(unsigned int size, gfp_t gfp)
  286. {
  287. if (size > KMALLOC_MAX_SIZE / sizeof(void *))
  288. return NULL;
  289. return kcalloc(size, sizeof(void *), gfp);
  290. }
  291. static inline int ptr_ring_init(struct ptr_ring *r, int size, gfp_t gfp)
  292. {
  293. r->queue = __ptr_ring_init_queue_alloc(size, gfp);
  294. if (!r->queue)
  295. return -ENOMEM;
  296. r->size = size;
  297. r->producer = r->consumer = 0;
  298. spin_lock_init(&r->producer_lock);
  299. spin_lock_init(&r->consumer_lock);
  300. return 0;
  301. }
  302. static inline void **__ptr_ring_swap_queue(struct ptr_ring *r, void **queue,
  303. int size, gfp_t gfp,
  304. void (*destroy)(void *))
  305. {
  306. int producer = 0;
  307. void **old;
  308. void *ptr;
  309. while ((ptr = __ptr_ring_consume(r)))
  310. if (producer < size)
  311. queue[producer++] = ptr;
  312. else if (destroy)
  313. destroy(ptr);
  314. r->size = size;
  315. r->producer = producer;
  316. r->consumer = 0;
  317. old = r->queue;
  318. r->queue = queue;
  319. return old;
  320. }
  321. /*
  322. * Note: producer lock is nested within consumer lock, so if you
  323. * resize you must make sure all uses nest correctly.
  324. * In particular if you consume ring in interrupt or BH context, you must
  325. * disable interrupts/BH when doing so.
  326. */
  327. static inline int ptr_ring_resize(struct ptr_ring *r, int size, gfp_t gfp,
  328. void (*destroy)(void *))
  329. {
  330. unsigned long flags;
  331. void **queue = __ptr_ring_init_queue_alloc(size, gfp);
  332. void **old;
  333. if (!queue)
  334. return -ENOMEM;
  335. spin_lock_irqsave(&(r)->consumer_lock, flags);
  336. spin_lock(&(r)->producer_lock);
  337. old = __ptr_ring_swap_queue(r, queue, size, gfp, destroy);
  338. spin_unlock(&(r)->producer_lock);
  339. spin_unlock_irqrestore(&(r)->consumer_lock, flags);
  340. kfree(old);
  341. return 0;
  342. }
  343. /*
  344. * Note: producer lock is nested within consumer lock, so if you
  345. * resize you must make sure all uses nest correctly.
  346. * In particular if you consume ring in interrupt or BH context, you must
  347. * disable interrupts/BH when doing so.
  348. */
  349. static inline int ptr_ring_resize_multiple(struct ptr_ring **rings,
  350. unsigned int nrings,
  351. int size,
  352. gfp_t gfp, void (*destroy)(void *))
  353. {
  354. unsigned long flags;
  355. void ***queues;
  356. int i;
  357. queues = kmalloc_array(nrings, sizeof(*queues), gfp);
  358. if (!queues)
  359. goto noqueues;
  360. for (i = 0; i < nrings; ++i) {
  361. queues[i] = __ptr_ring_init_queue_alloc(size, gfp);
  362. if (!queues[i])
  363. goto nomem;
  364. }
  365. for (i = 0; i < nrings; ++i) {
  366. spin_lock_irqsave(&(rings[i])->consumer_lock, flags);
  367. spin_lock(&(rings[i])->producer_lock);
  368. queues[i] = __ptr_ring_swap_queue(rings[i], queues[i],
  369. size, gfp, destroy);
  370. spin_unlock(&(rings[i])->producer_lock);
  371. spin_unlock_irqrestore(&(rings[i])->consumer_lock, flags);
  372. }
  373. for (i = 0; i < nrings; ++i)
  374. kfree(queues[i]);
  375. kfree(queues);
  376. return 0;
  377. nomem:
  378. while (--i >= 0)
  379. kfree(queues[i]);
  380. kfree(queues);
  381. noqueues:
  382. return -ENOMEM;
  383. }
  384. static inline void ptr_ring_cleanup(struct ptr_ring *r, void (*destroy)(void *))
  385. {
  386. void *ptr;
  387. if (destroy)
  388. while ((ptr = ptr_ring_consume(r)))
  389. destroy(ptr);
  390. kfree(r->queue);
  391. }
  392. #endif /* _LINUX_PTR_RING_H */