2 * Copyright (C) 2020 Francis Deslauriers <francis.deslauriers@efficios.com>
4 * SPDX-License-Identifier: GPL-2.0-only
12 #include <urcu/compiler.h>
15 #include <common/error.h>
16 #include <common/hashtable/hashtable.h>
17 #include <common/index-allocator.h>
18 #include <common/kernel-ctl/kernel-ctl.h>
19 #include <common/shm.h>
20 #include <lttng/trigger/trigger-internal.h>
22 #include "event-notifier-error-accounting.h"
23 #include "lttng-ust-error.h"
26 #define ERROR_COUNTER_INDEX_HT_INITIAL_SIZE 16
28 struct index_ht_entry
{
29 struct lttng_ht_node_u64 node
;
30 uint64_t error_counter_index
;
31 struct rcu_head rcu_head
;
34 struct ust_error_accounting_entry
{
37 struct lttng_ht_node_u64 node
;
38 struct rcu_head rcu_head
;
39 struct lttng_ust_ctl_daemon_counter
*daemon_counter
;
41 * Those `lttng_ust_abi_object_data` are anonymous handles to the
43 * They are only used to be duplicated for each new application of the
44 * user. To destroy them, call with the `sock` parameter set to -1.
45 * e.g. `lttng_ust_ctl_release_object(-1, data)`;
47 struct lttng_ust_abi_object_data
*counter
;
48 struct lttng_ust_abi_object_data
**cpu_counters
;
49 int nr_counter_cpu_fds
;
52 struct kernel_error_accounting_entry
{
56 static struct kernel_error_accounting_entry kernel_error_accounting_entry
;
58 /* Hashtable mapping uid to ust_error_accounting_entry. */
59 static struct lttng_ht
*error_counter_uid_ht
;
61 struct error_accounting_state
{
62 struct lttng_index_allocator
*index_allocator
;
63 /* Hashtable mapping event notifier token to index_ht_entry. */
64 struct lttng_ht
*indices_ht
;
65 uint64_t number_indices
;
68 static struct error_accounting_state ust_state
;
69 static struct error_accounting_state kernel_state
;
71 static inline void get_trigger_info_for_log(const struct lttng_trigger
*trigger
,
72 const char **trigger_name
,
73 uid_t
*trigger_owner_uid
)
75 enum lttng_trigger_status trigger_status
;
77 trigger_status
= lttng_trigger_get_name(trigger
, trigger_name
);
78 switch (trigger_status
) {
79 case LTTNG_TRIGGER_STATUS_OK
:
81 case LTTNG_TRIGGER_STATUS_UNSET
:
82 *trigger_name
= "(anonymous)";
88 trigger_status
= lttng_trigger_get_owner_uid(trigger
,
90 LTTNG_ASSERT(trigger_status
== LTTNG_TRIGGER_STATUS_OK
);
94 const char *error_accounting_status_str(
95 enum event_notifier_error_accounting_status status
)
98 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
:
100 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
:
102 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOT_FOUND
:
104 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOMEM
:
106 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NO_INDEX_AVAILABLE
:
107 return "NO_INDEX_AVAILABLE";
108 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_APP_DEAD
:
115 #ifdef HAVE_LIBLTTNG_UST_CTL
116 struct event_notifier_counter
{
117 pthread_mutex_t lock
;
121 static struct event_notifier_counter the_event_notifier_counter
;
123 static void free_ust_error_accounting_entry(struct rcu_head
*head
)
126 struct ust_error_accounting_entry
*entry
=
127 caa_container_of(head
, typeof(*entry
), rcu_head
);
129 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
130 lttng_ust_ctl_release_object(-1, entry
->cpu_counters
[i
]);
131 free(entry
->cpu_counters
[i
]);
134 free(entry
->cpu_counters
);
136 lttng_ust_ctl_release_object(-1, entry
->counter
);
137 free(entry
->counter
);
139 lttng_ust_ctl_destroy_counter(entry
->daemon_counter
);
145 bool ust_error_accounting_entry_get(struct ust_error_accounting_entry
*entry
)
147 return urcu_ref_get_unless_zero(&entry
->ref
);
151 void ust_error_accounting_entry_release(struct urcu_ref
*entry_ref
)
153 struct ust_error_accounting_entry
*entry
=
154 container_of(entry_ref
, typeof(*entry
), ref
);
157 cds_lfht_del(error_counter_uid_ht
->ht
, &entry
->node
.node
);
158 call_rcu(&entry
->rcu_head
, free_ust_error_accounting_entry
);
164 void ust_error_accounting_entry_put(struct ust_error_accounting_entry
*entry
)
170 urcu_ref_put(&entry
->ref
, ust_error_accounting_entry_release
);
174 * Put one reference on each UID entry.
177 void put_ref_all_ust_error_accounting_entry(void)
179 struct lttng_ht_iter iter
;
180 struct ust_error_accounting_entry
*uid_entry
;
182 ASSERT_LOCKED(the_event_notifier_counter
.lock
);
185 cds_lfht_for_each_entry(error_counter_uid_ht
->ht
, &iter
.iter
,
186 uid_entry
, node
.node
) {
187 ust_error_accounting_entry_put(uid_entry
);
194 * Get one reference on each UID entry.
197 void get_ref_all_ust_error_accounting_entry(void)
199 struct lttng_ht_iter iter
;
200 struct ust_error_accounting_entry
*uid_entry
;
202 ASSERT_LOCKED(the_event_notifier_counter
.lock
);
205 cds_lfht_for_each_entry(error_counter_uid_ht
->ht
, &iter
.iter
,
206 uid_entry
, node
.node
) {
207 ust_error_accounting_entry_get(uid_entry
);
213 #endif /* HAVE_LIBLTTNG_UST_CTL */
216 enum event_notifier_error_accounting_status
217 init_error_accounting_state(struct error_accounting_state
*state
,
218 uint64_t index_count
)
220 enum event_notifier_error_accounting_status status
;
224 state
->number_indices
= index_count
;
226 state
->index_allocator
= lttng_index_allocator_create(index_count
);
227 if (!state
->index_allocator
) {
228 ERR("Failed to allocate event notifier error counter index allocator");
229 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOMEM
;
233 state
->indices_ht
= lttng_ht_new(ERROR_COUNTER_INDEX_HT_INITIAL_SIZE
,
235 if (!state
->indices_ht
) {
236 ERR("Failed to allocate error counter indices hash table");
237 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOMEM
;
238 goto error_indices_ht
;
241 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
245 lttng_index_allocator_destroy(state
->index_allocator
);
246 state
->index_allocator
= NULL
;
252 void fini_error_accounting_state(struct error_accounting_state
*state
)
257 * Will assert if some error counter indices were not released (an
260 lttng_ht_destroy(state
->indices_ht
);
261 lttng_index_allocator_destroy(state
->index_allocator
);
264 enum event_notifier_error_accounting_status
265 event_notifier_error_accounting_init(uint64_t buffer_size_kernel
,
266 uint64_t buffer_size_ust
)
268 enum event_notifier_error_accounting_status status
;
270 status
= init_error_accounting_state(&kernel_state
, buffer_size_kernel
);
271 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
272 ERR("Failed to initialize kernel event notifier accounting state: status = %s",
273 error_accounting_status_str(status
));
277 status
= init_error_accounting_state(&ust_state
, buffer_size_ust
);
278 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
279 ERR("Failed to initialize UST event notifier accounting state: status = %s",
280 error_accounting_status_str(status
));
281 goto error_ust_state
;
284 error_counter_uid_ht
= lttng_ht_new(
285 ERROR_COUNTER_INDEX_HT_INITIAL_SIZE
, LTTNG_HT_TYPE_U64
);
286 if (!error_counter_uid_ht
) {
287 ERR("Failed to allocate UID to error counter accountant hash table");
288 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOMEM
;
292 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
296 fini_error_accounting_state(&ust_state
);
298 fini_error_accounting_state(&kernel_state
);
304 * Return the error counter index associated to this event notifier tracer
305 * token. Returns _STATUS_OK if found and _STATUS_NOT_FOUND otherwise.
308 enum event_notifier_error_accounting_status
get_error_counter_index_for_token(
309 struct error_accounting_state
*state
, uint64_t tracer_token
,
310 uint64_t *error_counter_index
)
312 struct lttng_ht_node_u64
*node
;
313 struct lttng_ht_iter iter
;
314 const struct index_ht_entry
*index_entry
;
315 enum event_notifier_error_accounting_status status
;
318 lttng_ht_lookup(state
->indices_ht
, &tracer_token
, &iter
);
319 node
= lttng_ht_iter_get_node_u64(&iter
);
321 index_entry
= caa_container_of(
322 node
, const struct index_ht_entry
, node
);
323 *error_counter_index
= index_entry
->error_counter_index
;
324 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
326 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOT_FOUND
;
333 #ifdef HAVE_LIBLTTNG_UST_CTL
335 * Find the entry for this app's UID, the caller acquires a reference if the
339 struct ust_error_accounting_entry
*ust_error_accounting_entry_find(
340 struct lttng_ht
*uid_ht
, const struct ust_app
*app
)
342 struct ust_error_accounting_entry
*entry
;
343 struct lttng_ht_node_u64
*node
;
344 struct lttng_ht_iter iter
;
345 uint64_t key
= app
->uid
;
347 lttng_ht_lookup(uid_ht
, &key
, &iter
);
348 node
= lttng_ht_iter_get_node_u64(&iter
);
354 entry
= caa_container_of(node
,
355 struct ust_error_accounting_entry
, node
);
357 got_ref
= ust_error_accounting_entry_get(entry
);
367 * Create the entry for this app's UID, the caller acquires a reference to the
371 struct ust_error_accounting_entry
*ust_error_accounting_entry_create(
372 const struct ust_app
*app
)
374 int i
, ret
, *cpu_counter_fds
= NULL
;
375 struct lttng_ust_ctl_daemon_counter
*daemon_counter
;
376 struct lttng_ust_abi_object_data
*counter
, **cpu_counters
;
377 struct ust_error_accounting_entry
*entry
= NULL
;
378 lttng_ust_ctl_counter_dimension dimension
;
380 dimension
.size
= ust_state
.number_indices
;
381 dimension
.has_underflow
= false;
382 dimension
.has_overflow
= false;
384 if (!ust_app_supports_counters(app
)) {
385 DBG("Refusing to create accounting entry for application (unsupported feature): app name = '%s', app ppid = %d",
386 app
->name
, (int) app
->ppid
);
390 entry
= (ust_error_accounting_entry
*) zmalloc(sizeof(struct ust_error_accounting_entry
));
392 PERROR("Failed to allocate event notifier error acounting entry")
396 urcu_ref_init(&entry
->ref
);
397 entry
->uid
= app
->uid
;
398 entry
->nr_counter_cpu_fds
= lttng_ust_ctl_get_nr_cpu_per_counter();
400 cpu_counter_fds
= (int *) zmalloc(entry
->nr_counter_cpu_fds
* sizeof(*cpu_counter_fds
));
401 if (!cpu_counter_fds
) {
402 PERROR("Failed to allocate event notifier error counter file descriptors array: application uid = %d, application name = '%s', pid = %d, allocation size = %zu",
403 (int) app
->uid
, app
->name
, (int) app
->pid
,
404 entry
->nr_counter_cpu_fds
* sizeof(*cpu_counter_fds
));
405 goto error_counter_cpu_fds_alloc
;
408 /* Initialize to an invalid fd value to close fds in case of error. */
409 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
410 cpu_counter_fds
[i
] = -1;
413 cpu_counters
= (lttng_ust_abi_object_data
**) zmalloc(entry
->nr_counter_cpu_fds
* sizeof(struct lttng_ust_abi_object_data
*));
415 PERROR("Failed to allocate event notifier error counter lttng_ust_abi_object_data array: application uid = %d, application name = '%s', pid = %d, allocation size = %zu",
416 (int) app
->uid
, app
->name
, (int) app
->pid
,
417 entry
->nr_counter_cpu_fds
* sizeof(struct lttng_ust_abi_object_data
*));
418 goto error_counter_cpus_alloc
;
421 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
422 cpu_counter_fds
[i
] = shm_create_anonymous("event-notifier-error-accounting");
423 if (cpu_counter_fds
[i
] == -1) {
424 ERR("Failed to create event notifier error accounting shared memory for application user: application uid = %d, pid = %d, application name = '%s'",
425 (int) app
->uid
, (int) app
->pid
, app
->name
);
426 goto error_shm_alloc
;
431 * Ownership of the file descriptors transferred to the ustctl object.
433 daemon_counter
= lttng_ust_ctl_create_counter(1, &dimension
, 0, -1,
434 entry
->nr_counter_cpu_fds
, cpu_counter_fds
,
435 LTTNG_UST_CTL_COUNTER_BITNESS_32
,
436 LTTNG_UST_CTL_COUNTER_ARITHMETIC_MODULAR
,
437 LTTNG_UST_CTL_COUNTER_ALLOC_PER_CPU
,
439 if (!daemon_counter
) {
440 goto error_create_daemon_counter
;
443 ret
= lttng_ust_ctl_create_counter_data(daemon_counter
, &counter
);
445 ERR("Failed to create userspace tracer counter data for application user: uid = %d, pid = %d, application name = '%s'",
446 (int) app
->uid
, (int) app
->pid
, app
->name
);
447 goto error_create_counter_data
;
450 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
451 ret
= lttng_ust_ctl_create_counter_cpu_data(daemon_counter
, i
,
454 ERR("Failed to create userspace tracer counter cpu data for application user: uid = %d, pid = %d, application name = '%s'",
455 (int) app
->uid
, (int) app
->pid
,
457 goto error_create_counter_cpu_data
;
461 entry
->daemon_counter
= daemon_counter
;
462 entry
->counter
= counter
;
463 entry
->cpu_counters
= cpu_counters
;
465 lttng_ht_node_init_u64(&entry
->node
, entry
->uid
);
466 lttng_ht_add_unique_u64(error_counter_uid_ht
, &entry
->node
);
470 error_create_counter_cpu_data
:
471 /* Teardown any allocated cpu counters. */
472 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
473 if (!cpu_counters
[i
]) {
475 * Early-exit when error occurred before all cpu
476 * counters could be initialized.
481 lttng_ust_ctl_release_object(-1, cpu_counters
[i
]);
482 free(cpu_counters
[i
]);
485 lttng_ust_ctl_release_object(-1, entry
->counter
);
486 free(entry
->counter
);
487 error_create_counter_data
:
488 lttng_ust_ctl_destroy_counter(daemon_counter
);
489 error_create_daemon_counter
:
491 /* Error occurred before per-cpu SHMs were handed-off to ustctl. */
492 if (cpu_counter_fds
) {
493 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
494 if (cpu_counter_fds
[i
] < 0) {
496 * Early-exit when error occurred before all cpu
497 * counter shm fds could be initialized.
502 ret
= close(cpu_counter_fds
[i
]);
504 PERROR("Failed to close error counter per-CPU shm file descriptor: fd = %d",
511 error_counter_cpus_alloc
:
512 error_counter_cpu_fds_alloc
:
517 free(cpu_counter_fds
);
522 enum event_notifier_error_accounting_status
send_counter_data_to_ust(
524 struct lttng_ust_abi_object_data
*new_counter
)
527 enum event_notifier_error_accounting_status status
;
529 /* Attach counter to trigger group. */
530 pthread_mutex_lock(&app
->sock_lock
);
531 ret
= lttng_ust_ctl_send_counter_data_to_ust(app
->sock
,
532 app
->event_notifier_group
.object
->handle
, new_counter
);
533 pthread_mutex_unlock(&app
->sock_lock
);
535 if (ret
!= -EPIPE
&& ret
!= -LTTNG_UST_ERR_EXITING
) {
536 ERR("Failed to send counter data to application: application name = '%s', pid = %d, ret = %d",
537 app
->name
, app
->pid
, ret
);
538 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
540 DBG3("Failed to send counter data to application (application is dead): application name = '%s', pid = %d, ret = %d",
541 app
->name
, app
->pid
, ret
);
542 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_APP_DEAD
;
548 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
554 enum event_notifier_error_accounting_status
send_counter_cpu_data_to_ust(
556 struct lttng_ust_abi_object_data
*counter
,
557 struct lttng_ust_abi_object_data
*counter_cpu
)
560 enum event_notifier_error_accounting_status status
;
562 pthread_mutex_lock(&app
->sock_lock
);
563 ret
= lttng_ust_ctl_send_counter_cpu_data_to_ust(app
->sock
,
564 counter
, counter_cpu
);
565 pthread_mutex_unlock(&app
->sock_lock
);
567 if (ret
!= -EPIPE
&& ret
!= -LTTNG_UST_ERR_EXITING
) {
568 ERR("Failed to send counter CPU data to application: application name = '%s', pid = %d, ret = %d",
569 app
->name
, app
->pid
, ret
);
570 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
572 DBG3("Failed to send counter CPU data to application: application name = '%s', pid = %d, ret = %d",
573 app
->name
, app
->pid
, ret
);
574 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_APP_DEAD
;
580 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
585 enum event_notifier_error_accounting_status
586 event_notifier_error_accounting_register_app(struct ust_app
*app
)
590 struct lttng_ust_abi_object_data
*new_counter
;
591 struct ust_error_accounting_entry
*entry
;
592 enum event_notifier_error_accounting_status status
;
593 struct lttng_ust_abi_object_data
**cpu_counters
;
595 if (!ust_app_supports_counters(app
)) {
596 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_UNSUPPORTED
;
601 * Check if we already have an error counter for the user id of this
602 * app. If not, create one.
605 entry
= ust_error_accounting_entry_find(error_counter_uid_ht
, app
);
608 * Take the event notifier counter lock before creating the new
609 * entry to ensure that no event notifier is registered between
610 * the entry creation and event notifier count check.
612 pthread_mutex_lock(&the_event_notifier_counter
.lock
);
614 entry
= ust_error_accounting_entry_create(app
);
616 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
617 pthread_mutex_unlock(&the_event_notifier_counter
.lock
);
618 goto error_creating_entry
;
622 * We just created a new UID entry. If there are event
623 * notifiers already registered, take one reference on their
626 if (the_event_notifier_counter
.count
> 0) {
627 ust_error_accounting_entry_get(entry
);
630 pthread_mutex_unlock(&the_event_notifier_counter
.lock
);
633 /* Duplicate counter object data. */
634 ret
= lttng_ust_ctl_duplicate_ust_object_data(&new_counter
,
637 ERR("Failed to duplicate event notifier error accounting counter for application user: application uid = %d, pid = %d, application name = '%s'",
638 (int) app
->uid
, (int) app
->pid
, app
->name
);
639 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
640 goto error_duplicate_counter
;
643 status
= send_counter_data_to_ust(app
, new_counter
);
644 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
645 if (status
== EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_APP_DEAD
) {
646 goto error_send_counter_data
;
649 ERR("Failed to send counter data to application tracer: status = %s, application uid = %d, pid = %d, application name = '%s'",
650 error_accounting_status_str(status
),
651 (int) app
->uid
, (int) app
->pid
, app
->name
);
652 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
653 goto error_send_counter_data
;
656 cpu_counters
= (lttng_ust_abi_object_data
**) zmalloc(entry
->nr_counter_cpu_fds
* sizeof(struct lttng_ust_abi_object_data
*));
658 PERROR("Failed to allocate event notifier error counter lttng_ust_abi_object_data array: application uid = %d, application name = '%s', pid = %d, allocation size = %zu",
659 (int) app
->uid
, app
->name
, (int) app
->pid
,
660 entry
->nr_counter_cpu_fds
* sizeof(**cpu_counters
));
661 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOMEM
;
662 goto error_allocate_cpu_counters
;
665 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
666 struct lttng_ust_abi_object_data
*new_counter_cpu
= NULL
;
668 ret
= lttng_ust_ctl_duplicate_ust_object_data(&new_counter_cpu
,
669 entry
->cpu_counters
[i
]);
671 ERR("Failed to duplicate userspace tracer counter cpu data for application user: uid = %d, pid = %d, application name = '%s'",
672 (int) app
->uid
, (int) app
->pid
,
674 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOMEM
;
675 goto error_duplicate_cpu_counter
;
678 cpu_counters
[i
] = new_counter_cpu
;
680 status
= send_counter_cpu_data_to_ust(app
, new_counter
,
682 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
683 if (status
== EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_APP_DEAD
) {
684 goto error_send_cpu_counter_data
;
687 ERR("Failed to send counter cpu data to application tracer: status = %s, application uid = %d, pid = %d, application name = '%s'",
688 error_accounting_status_str(status
),
689 (int) app
->uid
, (int) app
->pid
,
691 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
692 goto error_send_cpu_counter_data
;
696 app
->event_notifier_group
.counter
= new_counter
;
698 app
->event_notifier_group
.nr_counter_cpu
= entry
->nr_counter_cpu_fds
;
699 app
->event_notifier_group
.counter_cpu
= cpu_counters
;
703 error_send_cpu_counter_data
:
704 error_duplicate_cpu_counter
:
705 /* Teardown any duplicated cpu counters. */
706 for (i
= 0; i
< entry
->nr_counter_cpu_fds
; i
++) {
707 if (!cpu_counters
[i
]) {
709 * Early-exit when error occurred before all cpu
710 * counters could be initialized.
715 lttng_ust_ctl_release_object(-1, cpu_counters
[i
]);
716 free(cpu_counters
[i
]);
721 error_allocate_cpu_counters
:
722 error_send_counter_data
:
723 lttng_ust_ctl_release_object(-1, new_counter
);
725 error_duplicate_counter
:
726 ust_error_accounting_entry_put(entry
);
727 error_creating_entry
:
728 app
->event_notifier_group
.counter
= NULL
;
735 enum event_notifier_error_accounting_status
736 event_notifier_error_accounting_unregister_app(struct ust_app
*app
)
738 enum event_notifier_error_accounting_status status
;
739 struct ust_error_accounting_entry
*entry
;
744 /* If an error occurred during app registration no entry was created. */
745 if (!app
->event_notifier_group
.counter
) {
746 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
750 entry
= ust_error_accounting_entry_find(error_counter_uid_ht
, app
);
752 ERR("Failed to find event notitifier error accounting entry on application teardown: pid = %d, application name = '%s'",
753 app
->pid
, app
->name
);
754 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
758 * Put the entry twice as we acquired a reference from the
759 * `ust_error_accounting_entry_find()` above.
761 ust_error_accounting_entry_put(entry
);
762 ust_error_accounting_entry_put(entry
);
765 for (i
= 0; i
< app
->event_notifier_group
.nr_counter_cpu
; i
++) {
766 lttng_ust_ctl_release_object(app
->sock
,
767 app
->event_notifier_group
.counter_cpu
[i
]);
768 free(app
->event_notifier_group
.counter_cpu
[i
]);
771 free(app
->event_notifier_group
.counter_cpu
);
773 lttng_ust_ctl_release_object(app
->sock
, app
->event_notifier_group
.counter
);
774 free(app
->event_notifier_group
.counter
);
776 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
783 enum event_notifier_error_accounting_status
784 event_notifier_error_accounting_ust_get_count(
785 const struct lttng_trigger
*trigger
, uint64_t *count
)
787 struct lttng_ht_iter iter
;
788 struct ust_error_accounting_entry
*uid_entry
;
789 uint64_t error_counter_index
, global_sum
= 0;
790 enum event_notifier_error_accounting_status status
;
791 size_t dimension_indexes
[1];
792 const uint64_t tracer_token
= lttng_trigger_get_tracer_token(trigger
);
793 uid_t trigger_owner_uid
;
794 const char *trigger_name
;
799 get_trigger_info_for_log(trigger
, &trigger_name
, &trigger_owner_uid
);
801 status
= get_error_counter_index_for_token(&ust_state
, tracer_token
,
802 &error_counter_index
);
803 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
805 ERR("Failed to retrieve index for tracer token: token = %" PRIu64
", trigger name = '%s', trigger owner uid = %d, status = %s",
806 tracer_token
, trigger_name
,
807 (int) trigger_owner_uid
,
808 error_accounting_status_str(status
));
812 dimension_indexes
[0] = error_counter_index
;
815 * Iterate over all the UID entries.
816 * We aggregate the value of all uid entries regardless of if the uid
817 * matches the trigger's uid because a user that is allowed to register
818 * a trigger to a given sessiond is also allowed to create an event
819 * notifier on all apps that this sessiond is aware of.
821 cds_lfht_for_each_entry(error_counter_uid_ht
->ht
, &iter
.iter
,
822 uid_entry
, node
.node
) {
824 int64_t local_value
= 0;
825 bool overflow
= false, underflow
= false;
827 ret
= lttng_ust_ctl_counter_aggregate(uid_entry
->daemon_counter
,
828 dimension_indexes
, &local_value
, &overflow
,
830 if (ret
|| local_value
< 0) {
832 ERR("Failed to aggregate event notifier error counter values of trigger: trigger name = '%s', trigger owner uid = %d",
834 (int) trigger_owner_uid
);
835 } else if (local_value
< 0) {
836 ERR("Negative event notifier error counter value encountered during aggregation: trigger name = '%s', trigger owner uid = %d, value = %" PRId64
,
838 (int) trigger_owner_uid
,
844 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
848 /* Cast is safe as negative values are checked-for above. */
849 global_sum
+= (uint64_t) local_value
;
853 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
861 enum event_notifier_error_accounting_status
event_notifier_error_accounting_ust_clear(
862 const struct lttng_trigger
*trigger
)
864 struct lttng_ht_iter iter
;
865 struct ust_error_accounting_entry
*uid_entry
;
866 uint64_t error_counter_index
;
867 enum event_notifier_error_accounting_status status
;
868 size_t dimension_index
;
869 const uint64_t tracer_token
= lttng_trigger_get_tracer_token(trigger
);
872 status
= get_error_counter_index_for_token(&ust_state
, tracer_token
,
873 &error_counter_index
);
874 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
875 uid_t trigger_owner_uid
;
876 const char *trigger_name
;
878 get_trigger_info_for_log(trigger
, &trigger_name
,
881 ERR("Failed to retrieve index for tracer token: token = %" PRIu64
", trigger name = '%s', trigger owner uid = %d, status = %s",
882 tracer_token
, trigger_name
,
883 (int) trigger_owner_uid
,
884 error_accounting_status_str(status
));
888 dimension_index
= error_counter_index
;
891 * Go over all error counters (ignoring uid) as a trigger (and trigger
892 * errors) can be generated from any applications that this session
893 * daemon is managing.
895 cds_lfht_for_each_entry(error_counter_uid_ht
->ht
, &iter
.iter
,
896 uid_entry
, node
.node
) {
897 const int ret
= lttng_ust_ctl_counter_clear(uid_entry
->daemon_counter
,
901 uid_t trigger_owner_uid
;
902 const char *trigger_name
;
904 get_trigger_info_for_log(trigger
, &trigger_name
,
906 ERR("Failed to clear event notifier counter value for trigger: counter uid = %d, trigger name = '%s', trigger owner uid = %d",
907 (int) uid_entry
->node
.key
, trigger_name
,
908 (int) trigger_owner_uid
);
909 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
914 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
919 #endif /* HAVE_LIBLTTNG_UST_CTL */
922 enum event_notifier_error_accounting_status
923 event_notifier_error_accounting_kernel_clear(
924 const struct lttng_trigger
*trigger
)
927 uint64_t error_counter_index
;
928 enum event_notifier_error_accounting_status status
;
929 struct lttng_kernel_abi_counter_clear counter_clear
= {};
931 status
= get_error_counter_index_for_token(&kernel_state
,
932 lttng_trigger_get_tracer_token(trigger
),
933 &error_counter_index
);
934 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
935 uid_t trigger_owner_uid
;
936 const char *trigger_name
;
938 get_trigger_info_for_log(
939 trigger
, &trigger_name
, &trigger_owner_uid
);
941 ERR("Failed to get event notifier error counter index: trigger owner uid = %d, trigger name = '%s', status = '%s'",
942 trigger_owner_uid
, trigger_name
,
943 error_accounting_status_str(status
));
947 counter_clear
.index
.number_dimensions
= 1;
948 counter_clear
.index
.dimension_indexes
[0] = error_counter_index
;
950 ret
= kernctl_counter_clear(
951 kernel_error_accounting_entry
.error_counter_fd
,
954 uid_t trigger_owner_uid
;
955 const char *trigger_name
;
957 get_trigger_info_for_log(
958 trigger
, &trigger_name
, &trigger_owner_uid
);
960 ERR("Failed to clear kernel event notifier error counter: trigger owner uid = %d, trigger name = '%s'",
961 trigger_owner_uid
, trigger_name
);
962 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
966 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
971 enum event_notifier_error_accounting_status
972 event_notifier_error_accounting_register_kernel(
973 int kernel_event_notifier_group_fd
)
975 int error_counter_fd
= -1, ret
;
976 enum event_notifier_error_accounting_status status
;
977 lttng_kernel_abi_counter_conf error_counter_conf
= {
978 .arithmetic
= LTTNG_KERNEL_ABI_COUNTER_ARITHMETIC_MODULAR
,
979 .bitness
= sizeof(void *) == sizeof(uint32_t) ?
980 LTTNG_KERNEL_ABI_COUNTER_BITNESS_32
:
981 LTTNG_KERNEL_ABI_COUNTER_BITNESS_64
,
982 .number_dimensions
= 1,
983 .global_sum_step
= 0,
985 error_counter_conf
.dimensions
[0].size
= kernel_state
.number_indices
;
986 error_counter_conf
.dimensions
[0].has_underflow
= false;
987 error_counter_conf
.dimensions
[0].has_overflow
= false;
989 ret
= kernctl_create_event_notifier_group_error_counter(
990 kernel_event_notifier_group_fd
, &error_counter_conf
);
992 PERROR("Failed to create event notifier group error counter through kernel ioctl: kernel_event_notifier_group_fd = %d",
993 kernel_event_notifier_group_fd
);
994 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
998 error_counter_fd
= ret
;
1000 /* Prevent fd duplication after execlp(). */
1001 ret
= fcntl(error_counter_fd
, F_SETFD
, FD_CLOEXEC
);
1003 PERROR("Failed to set FD_CLOEXEC flag on event notifier error counter file descriptor: error_counter_fd = %d",
1005 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
1009 DBG("Created kernel event notifier group error counter: fd = %d",
1012 kernel_error_accounting_entry
.error_counter_fd
=
1014 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
1021 enum event_notifier_error_accounting_status
create_error_counter_index_for_token(
1022 struct error_accounting_state
*state
, uint64_t tracer_token
,
1023 uint64_t *error_counter_index
)
1025 struct index_ht_entry
*index_entry
;
1026 enum lttng_index_allocator_status index_alloc_status
;
1027 uint64_t local_error_counter_index
;
1028 enum event_notifier_error_accounting_status status
;
1030 LTTNG_ASSERT(state
);
1032 /* Allocate a new index for that counter. */
1033 index_alloc_status
= lttng_index_allocator_alloc(state
->index_allocator
,
1034 &local_error_counter_index
);
1035 switch (index_alloc_status
) {
1036 case LTTNG_INDEX_ALLOCATOR_STATUS_EMPTY
:
1037 DBG("No indices left in the configured event notifier error counter: "
1038 "number-of-indices = %" PRIu64
,
1039 lttng_index_allocator_get_index_count(
1040 state
->index_allocator
));
1041 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NO_INDEX_AVAILABLE
;
1043 case LTTNG_INDEX_ALLOCATOR_STATUS_OK
:
1046 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
1050 index_entry
= (index_ht_entry
*) zmalloc(sizeof(*index_entry
));
1051 if (index_entry
== NULL
) {
1052 PERROR("Failed to allocate event notifier error counter hash table entry");
1053 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOMEM
;
1057 index_entry
->error_counter_index
= local_error_counter_index
;
1058 lttng_ht_node_init_u64(&index_entry
->node
, tracer_token
);
1059 lttng_ht_add_unique_u64(state
->indices_ht
, &index_entry
->node
);
1061 DBG("Allocated error counter index for tracer token: tracer token = %" PRIu64
", index = %" PRIu64
,
1062 tracer_token
, local_error_counter_index
);
1063 *error_counter_index
= local_error_counter_index
;
1064 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
1069 enum event_notifier_error_accounting_status
1070 event_notifier_error_accounting_register_event_notifier(
1071 const struct lttng_trigger
*trigger
,
1072 uint64_t *error_counter_index
)
1074 enum event_notifier_error_accounting_status status
;
1075 uint64_t local_error_counter_index
;
1076 struct error_accounting_state
*state
;
1078 switch (lttng_trigger_get_underlying_domain_type_restriction(trigger
)) {
1079 case LTTNG_DOMAIN_KERNEL
:
1080 state
= &kernel_state
;
1082 case LTTNG_DOMAIN_UST
:
1083 case LTTNG_DOMAIN_PYTHON
:
1084 case LTTNG_DOMAIN_JUL
:
1085 case LTTNG_DOMAIN_LOG4J
:
1093 * Check if this event notifier already has an error counter index
1096 status
= get_error_counter_index_for_token(state
,
1097 lttng_trigger_get_tracer_token(trigger
),
1098 &local_error_counter_index
);
1100 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_NOT_FOUND
:
1102 uid_t trigger_owner_uid
;
1103 const char *trigger_name
;
1105 get_trigger_info_for_log(
1106 trigger
, &trigger_name
, &trigger_owner_uid
);
1108 DBG("Event notifier error counter index not found for tracer token (allocating a new one): trigger name = '%s', trigger owner uid = %d, tracer token = %" PRIu64
,
1109 trigger_name
, trigger_owner_uid
,
1110 lttng_trigger_get_tracer_token(trigger
));
1112 status
= create_error_counter_index_for_token(state
,
1113 lttng_trigger_get_tracer_token(trigger
),
1114 &local_error_counter_index
);
1115 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
1116 ERR("Error creating index for token: status = %s, trigger name = '%s', trigger owner uid = %d",
1117 error_accounting_status_str(status
),
1118 trigger_name
, trigger_owner_uid
);
1123 case EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
:
1124 *error_counter_index
= local_error_counter_index
;
1125 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
1131 #ifdef HAVE_LIBLTTNG_UST_CTL
1132 switch (lttng_trigger_get_underlying_domain_type_restriction(trigger
)) {
1133 case LTTNG_DOMAIN_UST
:
1134 case LTTNG_DOMAIN_PYTHON
:
1135 case LTTNG_DOMAIN_JUL
:
1136 case LTTNG_DOMAIN_LOG4J
:
1137 pthread_mutex_lock(&the_event_notifier_counter
.lock
);
1138 the_event_notifier_counter
.count
++;
1139 if (the_event_notifier_counter
.count
== 1) {
1141 * On the first event notifier, we get a reference to
1142 * every existing UID entries. This ensures that the
1143 * entries are kept around if there are still
1144 * registered event notifiers but no apps.
1146 get_ref_all_ust_error_accounting_entry();
1148 pthread_mutex_unlock(&the_event_notifier_counter
.lock
);
1153 #endif /* HAVE_LIBLTTNG_UST_CTL */
1161 enum event_notifier_error_accounting_status
1162 event_notifier_error_accounting_kernel_get_count(
1163 const struct lttng_trigger
*trigger
, uint64_t *count
)
1165 struct lttng_kernel_abi_counter_aggregate counter_aggregate
= {};
1166 enum event_notifier_error_accounting_status status
;
1167 uint64_t error_counter_index
;
1170 status
= get_error_counter_index_for_token(&kernel_state
,
1171 lttng_trigger_get_tracer_token(trigger
),
1172 &error_counter_index
);
1173 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
1174 ERR("Error getting index for token: status=%s",
1175 error_accounting_status_str(status
));
1179 counter_aggregate
.index
.number_dimensions
= 1;
1180 counter_aggregate
.index
.dimension_indexes
[0] = error_counter_index
;
1182 LTTNG_ASSERT(kernel_error_accounting_entry
.error_counter_fd
);
1184 ret
= kernctl_counter_get_aggregate_value(
1185 kernel_error_accounting_entry
.error_counter_fd
,
1186 &counter_aggregate
);
1187 if (ret
|| counter_aggregate
.value
.value
< 0) {
1188 uid_t trigger_owner_uid
;
1189 const char *trigger_name
;
1191 get_trigger_info_for_log(trigger
, &trigger_name
,
1192 &trigger_owner_uid
);
1194 if (counter_aggregate
.value
.value
< 0) {
1195 ERR("Invalid negative event notifier error counter value: trigger owner = %d, trigger name = '%s', value = %" PRId64
,
1196 trigger_owner_uid
, trigger_name
,
1197 counter_aggregate
.value
.value
);
1199 ERR("Failed to getting event notifier error count: trigger owner = %d, trigger name = '%s', ret = %d",
1200 trigger_owner_uid
, trigger_name
, ret
);
1203 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_ERR
;
1207 /* Error count can't be negative. */
1208 LTTNG_ASSERT(counter_aggregate
.value
.value
>= 0);
1209 *count
= (uint64_t) counter_aggregate
.value
.value
;
1211 status
= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
1217 enum event_notifier_error_accounting_status
1218 event_notifier_error_accounting_get_count(
1219 const struct lttng_trigger
*trigger
, uint64_t *count
)
1221 switch (lttng_trigger_get_underlying_domain_type_restriction(trigger
)) {
1222 case LTTNG_DOMAIN_KERNEL
:
1223 return event_notifier_error_accounting_kernel_get_count(
1225 case LTTNG_DOMAIN_UST
:
1226 case LTTNG_DOMAIN_PYTHON
:
1227 case LTTNG_DOMAIN_JUL
:
1228 case LTTNG_DOMAIN_LOG4J
:
1229 #ifdef HAVE_LIBLTTNG_UST_CTL
1230 return event_notifier_error_accounting_ust_get_count(trigger
,
1234 return EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
1235 #endif /* HAVE_LIBLTTNG_UST_CTL */
1242 enum event_notifier_error_accounting_status
1243 event_notifier_error_accounting_clear(const struct lttng_trigger
*trigger
)
1245 switch (lttng_trigger_get_underlying_domain_type_restriction(trigger
)) {
1246 case LTTNG_DOMAIN_KERNEL
:
1247 return event_notifier_error_accounting_kernel_clear(trigger
);
1248 case LTTNG_DOMAIN_UST
:
1249 case LTTNG_DOMAIN_PYTHON
:
1250 case LTTNG_DOMAIN_JUL
:
1251 case LTTNG_DOMAIN_LOG4J
:
1252 #ifdef HAVE_LIBLTTNG_UST_CTL
1253 return event_notifier_error_accounting_ust_clear(trigger
);
1255 return EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
;
1256 #endif /* HAVE_LIBLTTNG_UST_CTL */
1262 static void free_index_ht_entry(struct rcu_head
*head
)
1264 struct index_ht_entry
*entry
= caa_container_of(head
,
1265 struct index_ht_entry
, rcu_head
);
1270 void event_notifier_error_accounting_unregister_event_notifier(
1271 const struct lttng_trigger
*trigger
)
1273 struct lttng_ht_iter iter
;
1274 struct lttng_ht_node_u64
*node
;
1275 const uint64_t tracer_token
= lttng_trigger_get_tracer_token(trigger
);
1276 enum event_notifier_error_accounting_status status
;
1277 struct error_accounting_state
*state
;
1279 status
= event_notifier_error_accounting_clear(trigger
);
1280 if (status
!= EVENT_NOTIFIER_ERROR_ACCOUNTING_STATUS_OK
) {
1281 /* Trigger details already logged by callee on error. */
1282 ERR("Failed to clear event notifier error counter during unregistration of event notifier: status = '%s'",
1283 error_accounting_status_str(status
));
1289 switch (lttng_trigger_get_underlying_domain_type_restriction(trigger
)) {
1290 case LTTNG_DOMAIN_KERNEL
:
1291 state
= &kernel_state
;
1293 #ifdef HAVE_LIBLTTNG_UST_CTL
1294 case LTTNG_DOMAIN_UST
:
1295 case LTTNG_DOMAIN_PYTHON
:
1296 case LTTNG_DOMAIN_JUL
:
1297 case LTTNG_DOMAIN_LOG4J
:
1300 pthread_mutex_lock(&the_event_notifier_counter
.lock
);
1301 the_event_notifier_counter
.count
--;
1302 if (the_event_notifier_counter
.count
== 0) {
1305 * When unregistering the last event notifier, put one
1306 * reference to every uid entries on the behalf of all
1309 put_ref_all_ust_error_accounting_entry();
1312 pthread_mutex_unlock(&the_event_notifier_counter
.lock
);
1315 #endif /* HAVE_LIBLTTNG_UST_CTL */
1320 lttng_ht_lookup(state
->indices_ht
, &tracer_token
, &iter
);
1321 node
= lttng_ht_iter_get_node_u64(&iter
);
1324 struct index_ht_entry
*index_entry
= caa_container_of(
1325 node
, typeof(*index_entry
), node
);
1326 enum lttng_index_allocator_status index_alloc_status
;
1328 index_alloc_status
= lttng_index_allocator_release(
1329 state
->index_allocator
,
1330 index_entry
->error_counter_index
);
1331 if (index_alloc_status
!= LTTNG_INDEX_ALLOCATOR_STATUS_OK
) {
1332 uid_t trigger_owner_uid
;
1333 const char *trigger_name
;
1335 get_trigger_info_for_log(trigger
, &trigger_name
,
1336 &trigger_owner_uid
);
1338 ERR("Failed to release event notifier error counter index: index = %" PRIu64
", trigger name = '%s', trigger owner uid = %d",
1339 index_entry
->error_counter_index
,
1340 trigger_name
, (int) trigger_owner_uid
);
1341 /* Don't exit, perform the rest of the clean-up. */
1344 del_ret
= lttng_ht_del(state
->indices_ht
, &iter
);
1345 LTTNG_ASSERT(!del_ret
);
1346 call_rcu(&index_entry
->rcu_head
, free_index_ht_entry
);
1353 void event_notifier_error_accounting_fini(void)
1355 if (kernel_error_accounting_entry
.error_counter_fd
) {
1356 const int ret
= close(kernel_error_accounting_entry
.error_counter_fd
);
1359 PERROR("Failed to close kernel event notifier error counter");
1363 lttng_ht_destroy(error_counter_uid_ht
);
1365 fini_error_accounting_state(&kernel_state
);
1366 fini_error_accounting_state(&ust_state
);