Fix: ACCESS_ONCE() removed in kernel 4.15
[lttng-modules.git] / lib / ringbuffer / backend.h
CommitLineData
886d51a3
MD
1#ifndef _LIB_RING_BUFFER_BACKEND_H
2#define _LIB_RING_BUFFER_BACKEND_H
f3bc08c5
MD
3
4/*
886d51a3 5 * lib/ringbuffer/backend.h
f3bc08c5
MD
6 *
7 * Ring buffer backend (API).
8 *
886d51a3
MD
9 * Copyright (C) 2010-2012 Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
10 *
11 * This library is free software; you can redistribute it and/or
12 * modify it under the terms of the GNU Lesser General Public
13 * License as published by the Free Software Foundation; only
14 * version 2.1 of the License.
15 *
16 * This library is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19 * Lesser General Public License for more details.
20 *
21 * You should have received a copy of the GNU Lesser General Public
22 * License along with this library; if not, write to the Free Software
23 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
f3bc08c5
MD
24 *
25 * Credits to Steven Rostedt for proposing to use an extra-subbuffer owned by
26 * the reader in flight recorder mode.
27 */
28
29#include <linux/types.h>
30#include <linux/sched.h>
31#include <linux/timer.h>
32#include <linux/wait.h>
33#include <linux/poll.h>
34#include <linux/list.h>
35#include <linux/fs.h>
36#include <linux/mm.h>
7b8ea3a5 37#include <linux/uaccess.h>
f3bc08c5
MD
38
39/* Internal helpers */
5671a661
MD
40#include <wrapper/ringbuffer/backend_internal.h>
41#include <wrapper/ringbuffer/frontend_internal.h>
f3bc08c5
MD
42
43/* Ring buffer backend API */
44
45/* Ring buffer backend access (read/write) */
46
47extern size_t lib_ring_buffer_read(struct lib_ring_buffer_backend *bufb,
48 size_t offset, void *dest, size_t len);
49
50extern int __lib_ring_buffer_copy_to_user(struct lib_ring_buffer_backend *bufb,
51 size_t offset, void __user *dest,
52 size_t len);
53
54extern int lib_ring_buffer_read_cstr(struct lib_ring_buffer_backend *bufb,
55 size_t offset, void *dest, size_t len);
56
0112cb7b
MD
57extern unsigned long *
58lib_ring_buffer_read_get_pfn(struct lib_ring_buffer_backend *bufb, size_t offset,
f3bc08c5
MD
59 void ***virt);
60
61/*
62 * Return the address where a given offset is located.
63 * Should be used to get the current subbuffer header pointer. Given we know
64 * it's never on a page boundary, it's safe to write directly to this address,
65 * as long as the write is never bigger than a page size.
66 */
67extern void *
68lib_ring_buffer_offset_address(struct lib_ring_buffer_backend *bufb,
69 size_t offset);
70extern void *
71lib_ring_buffer_read_offset_address(struct lib_ring_buffer_backend *bufb,
72 size_t offset);
73
74/**
75 * lib_ring_buffer_write - write data to a buffer backend
76 * @config : ring buffer instance configuration
77 * @ctx: ring buffer context. (input arguments only)
78 * @src : source pointer to copy from
79 * @len : length of data to copy
80 *
81 * This function copies "len" bytes of data from a source pointer to a buffer
82 * backend, at the current context offset. This is more or less a buffer
83 * backend-specific memcpy() operation. Calls the slow path (_ring_buffer_write)
84 * if copy is crossing a page boundary.
85 */
8617eb9a 86static inline __attribute__((always_inline))
f3bc08c5
MD
87void lib_ring_buffer_write(const struct lib_ring_buffer_config *config,
88 struct lib_ring_buffer_ctx *ctx,
89 const void *src, size_t len)
90{
91 struct lib_ring_buffer_backend *bufb = &ctx->buf->backend;
92 struct channel_backend *chanb = &ctx->chan->backend;
85a07c33 93 size_t index, pagecpy;
f3bc08c5 94 size_t offset = ctx->buf_offset;
85a07c33 95 struct lib_ring_buffer_backend_pages *backend_pages;
f3bc08c5 96
61eb4c39
MD
97 if (unlikely(!len))
98 return;
85a07c33
MD
99 backend_pages =
100 lib_ring_buffer_get_backend_pages_from_ctx(config, ctx);
f3bc08c5 101 offset &= chanb->buf_size - 1;
f3bc08c5
MD
102 index = (offset & (chanb->subbuf_size - 1)) >> PAGE_SHIFT;
103 pagecpy = min_t(size_t, len, (-offset) & ~PAGE_MASK);
f3bc08c5
MD
104 if (likely(pagecpy == len))
105 lib_ring_buffer_do_copy(config,
85a07c33 106 backend_pages->p[index].virt
f3bc08c5
MD
107 + (offset & ~PAGE_MASK),
108 src, len);
109 else
110 _lib_ring_buffer_write(bufb, offset, src, len, 0);
111 ctx->buf_offset += len;
112}
113
4ea00e4f
JD
114/**
115 * lib_ring_buffer_memset - write len bytes of c to a buffer backend
116 * @config : ring buffer instance configuration
117 * @bufb : ring buffer backend
118 * @offset : offset within the buffer
119 * @c : the byte to copy
120 * @len : number of bytes to copy
121 *
122 * This function writes "len" bytes of "c" to a buffer backend, at a specific
123 * offset. This is more or less a buffer backend-specific memset() operation.
124 * Calls the slow path (_ring_buffer_memset) if write is crossing a page
125 * boundary.
126 */
127static inline
128void lib_ring_buffer_memset(const struct lib_ring_buffer_config *config,
129 struct lib_ring_buffer_ctx *ctx, int c, size_t len)
130{
131
132 struct lib_ring_buffer_backend *bufb = &ctx->buf->backend;
133 struct channel_backend *chanb = &ctx->chan->backend;
85a07c33 134 size_t index, pagecpy;
4ea00e4f 135 size_t offset = ctx->buf_offset;
85a07c33 136 struct lib_ring_buffer_backend_pages *backend_pages;
4ea00e4f 137
61eb4c39
MD
138 if (unlikely(!len))
139 return;
85a07c33
MD
140 backend_pages =
141 lib_ring_buffer_get_backend_pages_from_ctx(config, ctx);
4ea00e4f 142 offset &= chanb->buf_size - 1;
4ea00e4f
JD
143 index = (offset & (chanb->subbuf_size - 1)) >> PAGE_SHIFT;
144 pagecpy = min_t(size_t, len, (-offset) & ~PAGE_MASK);
4ea00e4f 145 if (likely(pagecpy == len))
85a07c33 146 lib_ring_buffer_do_memset(backend_pages->p[index].virt
4ea00e4f
JD
147 + (offset & ~PAGE_MASK),
148 c, len);
149 else
150 _lib_ring_buffer_memset(bufb, offset, c, len, 0);
151 ctx->buf_offset += len;
152}
153
16f78f3a
MD
/*
 * Copy at most @len string bytes from @src to @dest, stopping early at
 * the first NUL character found in @src. Returns how many bytes were
 * copied. The terminating NUL is *not* written to @dest.
 */
static inline __attribute__((always_inline))
size_t lib_ring_buffer_do_strcpy(const struct lib_ring_buffer_config *config,
		char *dest, const char *src, size_t len)
{
	size_t copied = 0;

	while (copied < len) {
		/*
		 * Load each source character exactly once: the source
		 * may be modified concurrently, and the value tested
		 * must be the value stored.
		 */
		char ch = READ_ONCE(src[copied]);

		if (ch == '\0')
			break;
		lib_ring_buffer_do_copy(config, &dest[copied], &ch, 1);
		copied++;
	}
	return copied;
}
179
180/*
181 * Copy up to @len string bytes from @src to @dest. Stop whenever a NULL
182 * terminating character is found in @src, or when a fault occurs.
183 * Returns the number of bytes copied. Does *not* terminate @dest with
184 * NULL terminating character.
185 *
186 * This function deals with userspace pointers, it should never be called
187 * directly without having the src pointer checked with access_ok()
188 * previously.
189 */
d723e905 190static inline __attribute__((always_inline))
16f78f3a
MD
191size_t lib_ring_buffer_do_strcpy_from_user_inatomic(const struct lib_ring_buffer_config *config,
192 char *dest, const char __user *src, size_t len)
193{
194 size_t count;
195
196 for (count = 0; count < len; count++) {
197 int ret;
198 char c;
199
f127e61e 200 ret = __copy_from_user_inatomic(&c, src + count, 1);
16f78f3a
MD
201 if (ret || !c)
202 break;
203 lib_ring_buffer_do_copy(config, &dest[count], &c, 1);
204 }
205 return count;
206}
207
208/**
209 * lib_ring_buffer_strcpy - write string data to a buffer backend
210 * @config : ring buffer instance configuration
211 * @ctx: ring buffer context. (input arguments only)
212 * @src : source pointer to copy from
213 * @len : length of data to copy
214 * @pad : character to use for padding
215 *
216 * This function copies @len - 1 bytes of string data from a source
217 * pointer to a buffer backend, followed by a terminating '\0'
218 * character, at the current context offset. This is more or less a
219 * buffer backend-specific strncpy() operation. If a terminating '\0'
220 * character is found in @src before @len - 1 characters are copied, pad
221 * the buffer with @pad characters (e.g. '#'). Calls the slow path
222 * (_ring_buffer_strcpy) if copy is crossing a page boundary.
223 */
224static inline
225void lib_ring_buffer_strcpy(const struct lib_ring_buffer_config *config,
226 struct lib_ring_buffer_ctx *ctx,
227 const char *src, size_t len, int pad)
228{
229 struct lib_ring_buffer_backend *bufb = &ctx->buf->backend;
230 struct channel_backend *chanb = &ctx->chan->backend;
85a07c33 231 size_t index, pagecpy;
16f78f3a 232 size_t offset = ctx->buf_offset;
85a07c33 233 struct lib_ring_buffer_backend_pages *backend_pages;
16f78f3a
MD
234
235 if (unlikely(!len))
236 return;
85a07c33
MD
237 backend_pages =
238 lib_ring_buffer_get_backend_pages_from_ctx(config, ctx);
16f78f3a 239 offset &= chanb->buf_size - 1;
16f78f3a
MD
240 index = (offset & (chanb->subbuf_size - 1)) >> PAGE_SHIFT;
241 pagecpy = min_t(size_t, len, (-offset) & ~PAGE_MASK);
16f78f3a
MD
242 if (likely(pagecpy == len)) {
243 size_t count;
244
245 count = lib_ring_buffer_do_strcpy(config,
85a07c33 246 backend_pages->p[index].virt
16f78f3a
MD
247 + (offset & ~PAGE_MASK),
248 src, len - 1);
249 offset += count;
250 /* Padding */
251 if (unlikely(count < len - 1)) {
252 size_t pad_len = len - 1 - count;
253
85a07c33 254 lib_ring_buffer_do_memset(backend_pages->p[index].virt
16f78f3a
MD
255 + (offset & ~PAGE_MASK),
256 pad, pad_len);
257 offset += pad_len;
258 }
259 /* Ending '\0' */
85a07c33 260 lib_ring_buffer_do_memset(backend_pages->p[index].virt
16f78f3a
MD
261 + (offset & ~PAGE_MASK),
262 '\0', 1);
263 } else {
264 _lib_ring_buffer_strcpy(bufb, offset, src, len, 0, pad);
265 }
266 ctx->buf_offset += len;
267}
268
4ea00e4f 269/**
7b8ea3a5 270 * lib_ring_buffer_copy_from_user_inatomic - write userspace data to a buffer backend
4ea00e4f
JD
271 * @config : ring buffer instance configuration
272 * @ctx: ring buffer context. (input arguments only)
273 * @src : userspace source pointer to copy from
274 * @len : length of data to copy
275 *
276 * This function copies "len" bytes of data from a userspace pointer to a
277 * buffer backend, at the current context offset. This is more or less a buffer
278 * backend-specific memcpy() operation. Calls the slow path
7b8ea3a5
MD
279 * (_ring_buffer_write_from_user_inatomic) if copy is crossing a page boundary.
280 * Disable the page fault handler to ensure we never try to take the mmap_sem.
4ea00e4f 281 */
d723e905 282static inline __attribute__((always_inline))
7b8ea3a5 283void lib_ring_buffer_copy_from_user_inatomic(const struct lib_ring_buffer_config *config,
4ea00e4f
JD
284 struct lib_ring_buffer_ctx *ctx,
285 const void __user *src, size_t len)
286{
287 struct lib_ring_buffer_backend *bufb = &ctx->buf->backend;
288 struct channel_backend *chanb = &ctx->chan->backend;
85a07c33 289 size_t index, pagecpy;
4ea00e4f 290 size_t offset = ctx->buf_offset;
85a07c33 291 struct lib_ring_buffer_backend_pages *backend_pages;
4ea00e4f 292 unsigned long ret;
7b8ea3a5 293 mm_segment_t old_fs = get_fs();
4ea00e4f 294
61eb4c39
MD
295 if (unlikely(!len))
296 return;
85a07c33
MD
297 backend_pages =
298 lib_ring_buffer_get_backend_pages_from_ctx(config, ctx);
4ea00e4f 299 offset &= chanb->buf_size - 1;
4ea00e4f
JD
300 index = (offset & (chanb->subbuf_size - 1)) >> PAGE_SHIFT;
301 pagecpy = min_t(size_t, len, (-offset) & ~PAGE_MASK);
4ea00e4f 302
7b8ea3a5
MD
303 set_fs(KERNEL_DS);
304 pagefault_disable();
4ea00e4f
JD
305 if (unlikely(!access_ok(VERIFY_READ, src, len)))
306 goto fill_buffer;
307
308 if (likely(pagecpy == len)) {
7b8ea3a5 309 ret = lib_ring_buffer_do_copy_from_user_inatomic(
85a07c33 310 backend_pages->p[index].virt + (offset & ~PAGE_MASK),
4ea00e4f
JD
311 src, len);
312 if (unlikely(ret > 0)) {
d87a9f03 313 /* Copy failed. */
4ea00e4f
JD
314 goto fill_buffer;
315 }
316 } else {
7b8ea3a5 317 _lib_ring_buffer_copy_from_user_inatomic(bufb, offset, src, len, 0);
4ea00e4f 318 }
7b8ea3a5
MD
319 pagefault_enable();
320 set_fs(old_fs);
4ea00e4f
JD
321 ctx->buf_offset += len;
322
323 return;
324
325fill_buffer:
7b8ea3a5
MD
326 pagefault_enable();
327 set_fs(old_fs);
4ea00e4f
JD
328 /*
329 * In the error path we call the slow path version to avoid
330 * the pollution of static inline code.
331 */
332 _lib_ring_buffer_memset(bufb, offset, 0, len, 0);
333}
334
16f78f3a
MD
335/**
336 * lib_ring_buffer_strcpy_from_user_inatomic - write userspace string data to a buffer backend
337 * @config : ring buffer instance configuration
338 * @ctx: ring buffer context (input arguments only)
339 * @src : userspace source pointer to copy from
340 * @len : length of data to copy
341 * @pad : character to use for padding
342 *
343 * This function copies @len - 1 bytes of string data from a userspace
344 * source pointer to a buffer backend, followed by a terminating '\0'
345 * character, at the current context offset. This is more or less a
346 * buffer backend-specific strncpy() operation. If a terminating '\0'
347 * character is found in @src before @len - 1 characters are copied, pad
348 * the buffer with @pad characters (e.g. '#'). Calls the slow path
349 * (_ring_buffer_strcpy_from_user_inatomic) if copy is crossing a page
350 * boundary. Disable the page fault handler to ensure we never try to
351 * take the mmap_sem.
352 */
353static inline
354void lib_ring_buffer_strcpy_from_user_inatomic(const struct lib_ring_buffer_config *config,
355 struct lib_ring_buffer_ctx *ctx,
356 const void __user *src, size_t len, int pad)
357{
358 struct lib_ring_buffer_backend *bufb = &ctx->buf->backend;
359 struct channel_backend *chanb = &ctx->chan->backend;
85a07c33 360 size_t index, pagecpy;
16f78f3a 361 size_t offset = ctx->buf_offset;
85a07c33 362 struct lib_ring_buffer_backend_pages *backend_pages;
16f78f3a
MD
363 mm_segment_t old_fs = get_fs();
364
365 if (unlikely(!len))
366 return;
85a07c33
MD
367 backend_pages =
368 lib_ring_buffer_get_backend_pages_from_ctx(config, ctx);
16f78f3a 369 offset &= chanb->buf_size - 1;
16f78f3a
MD
370 index = (offset & (chanb->subbuf_size - 1)) >> PAGE_SHIFT;
371 pagecpy = min_t(size_t, len, (-offset) & ~PAGE_MASK);
16f78f3a
MD
372
373 set_fs(KERNEL_DS);
374 pagefault_disable();
375 if (unlikely(!access_ok(VERIFY_READ, src, len)))
376 goto fill_buffer;
377
378 if (likely(pagecpy == len)) {
379 size_t count;
380
381 count = lib_ring_buffer_do_strcpy_from_user_inatomic(config,
85a07c33 382 backend_pages->p[index].virt
16f78f3a
MD
383 + (offset & ~PAGE_MASK),
384 src, len - 1);
385 offset += count;
386 /* Padding */
387 if (unlikely(count < len - 1)) {
388 size_t pad_len = len - 1 - count;
389
85a07c33 390 lib_ring_buffer_do_memset(backend_pages->p[index].virt
16f78f3a
MD
391 + (offset & ~PAGE_MASK),
392 pad, pad_len);
393 offset += pad_len;
394 }
395 /* Ending '\0' */
85a07c33 396 lib_ring_buffer_do_memset(backend_pages->p[index].virt
16f78f3a
MD
397 + (offset & ~PAGE_MASK),
398 '\0', 1);
399 } else {
400 _lib_ring_buffer_strcpy_from_user_inatomic(bufb, offset, src,
401 len, 0, pad);
402 }
403 pagefault_enable();
404 set_fs(old_fs);
405 ctx->buf_offset += len;
406
407 return;
408
409fill_buffer:
410 pagefault_enable();
411 set_fs(old_fs);
412 /*
413 * In the error path we call the slow path version to avoid
414 * the pollution of static inline code.
415 */
416 _lib_ring_buffer_memset(bufb, offset, pad, len - 1, 0);
417 offset += len - 1;
418 _lib_ring_buffer_memset(bufb, offset, '\0', 1, 0);
419}
420
f3bc08c5
MD
421/*
422 * This accessor counts the number of unread records in a buffer.
423 * It only provides a consistent value if no reads not writes are performed
424 * concurrently.
425 */
426static inline
427unsigned long lib_ring_buffer_get_records_unread(
428 const struct lib_ring_buffer_config *config,
429 struct lib_ring_buffer *buf)
430{
431 struct lib_ring_buffer_backend *bufb = &buf->backend;
432 struct lib_ring_buffer_backend_pages *pages;
433 unsigned long records_unread = 0, sb_bindex, id;
434 unsigned int i;
435
436 for (i = 0; i < bufb->chan->backend.num_subbuf; i++) {
437 id = bufb->buf_wsb[i].id;
438 sb_bindex = subbuffer_id_get_index(config, id);
439 pages = bufb->array[sb_bindex];
440 records_unread += v_read(config, &pages->records_unread);
441 }
442 if (config->mode == RING_BUFFER_OVERWRITE) {
443 id = bufb->buf_rsb.id;
444 sb_bindex = subbuffer_id_get_index(config, id);
445 pages = bufb->array[sb_bindex];
446 records_unread += v_read(config, &pages->records_unread);
447 }
448 return records_unread;
449}
450
3c8ebbc8
MD
451/*
452 * We use __copy_from_user_inatomic to copy userspace data after
453 * checking with access_ok() and disabling page faults.
454 *
455 * Return 0 if OK, nonzero on error.
456 */
457static inline
458unsigned long lib_ring_buffer_copy_from_user_check_nofault(void *dest,
459 const void __user *src,
460 unsigned long len)
461{
462 unsigned long ret;
463 mm_segment_t old_fs;
464
465 if (!access_ok(VERIFY_READ, src, len))
466 return 1;
467 old_fs = get_fs();
468 set_fs(KERNEL_DS);
469 pagefault_disable();
470 ret = __copy_from_user_inatomic(dest, src, len);
471 pagefault_enable();
472 set_fs(old_fs);
473 return ret;
474}
475
886d51a3 476#endif /* _LIB_RING_BUFFER_BACKEND_H */
This page took 0.052009 seconds and 4 git commands to generate.