consumerd: Implement clear stream/session commands
[lttng-tools.git] / src / common / ust-consumer / ust-consumer.c
CommitLineData
3bd1e081
MD
1/*
2 * Copyright (C) 2011 - Julien Desfossez <julien.desfossez@polymtl.ca>
3 * Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
b3530820 4 * Copyright (C) 2017 - Jérémie Galarneau <jeremie.galarneau@efficios.com>
3bd1e081 5 *
d14d33bf
AM
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License, version 2 only,
8 * as published by the Free Software Foundation.
3bd1e081
MD
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
d14d33bf
AM
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
3bd1e081
MD
18 */
19
6c1c0768 20#define _LGPL_SOURCE
3bd1e081 21#include <assert.h>
f02e1e8a 22#include <lttng/ust-ctl.h>
3bd1e081
MD
23#include <poll.h>
24#include <pthread.h>
25#include <stdlib.h>
26#include <string.h>
27#include <sys/mman.h>
28#include <sys/socket.h>
dbb5dfe6 29#include <sys/stat.h>
3bd1e081 30#include <sys/types.h>
77c7c900 31#include <inttypes.h>
3bd1e081 32#include <unistd.h>
ffe60014 33#include <urcu/list.h>
331744e3 34#include <signal.h>
0857097f 35
51a9e1c7 36#include <bin/lttng-consumerd/health-consumerd.h>
990570ed 37#include <common/common.h>
10a8a223 38#include <common/sessiond-comm/sessiond-comm.h>
00e2e675 39#include <common/relayd/relayd.h>
dbb5dfe6 40#include <common/compat/fcntl.h>
f263b7fd 41#include <common/compat/endian.h>
c8fea79c
JR
42#include <common/consumer/consumer-metadata-cache.h>
43#include <common/consumer/consumer-stream.h>
44#include <common/consumer/consumer-timer.h>
fe4477ee 45#include <common/utils.h>
309167d2 46#include <common/index/index.h>
10a8a223
DG
47
48#include "ust-consumer.h"
3bd1e081 49
45863397 50#define INT_MAX_STR_LEN 12 /* includes \0 */
4628484a 51
3bd1e081
MD
52extern struct lttng_consumer_global_data consumer_data;
53extern int consumer_poll_timeout;
3bd1e081
MD
54
55/*
ffe60014
DG
56 * Free channel object and all streams associated with it. This MUST be used
57 * only and only if the channel has _NEVER_ been added to the global channel
58 * hash table.
3bd1e081 59 */
ffe60014 60static void destroy_channel(struct lttng_consumer_channel *channel)
3bd1e081 61{
ffe60014
DG
62 struct lttng_consumer_stream *stream, *stmp;
63
64 assert(channel);
65
66 DBG("UST consumer cleaning stream list");
67
68 cds_list_for_each_entry_safe(stream, stmp, &channel->streams.head,
69 send_node) {
9ce5646a
MD
70
71 health_code_update();
72
ffe60014
DG
73 cds_list_del(&stream->send_node);
74 ustctl_destroy_stream(stream->ustream);
75 free(stream);
76 }
77
78 /*
79 * If a channel is available meaning that was created before the streams
80 * were, delete it.
81 */
82 if (channel->uchan) {
83 lttng_ustconsumer_del_channel(channel);
b83e03c4 84 lttng_ustconsumer_free_channel(channel);
ffe60014
DG
85 }
86 free(channel);
87}
3bd1e081
MD
88
89/*
ffe60014 90 * Add channel to internal consumer state.
3bd1e081 91 *
ffe60014 92 * Returns 0 on success or else a negative value.
3bd1e081 93 */
ffe60014
DG
94static int add_channel(struct lttng_consumer_channel *channel,
95 struct lttng_consumer_local_data *ctx)
3bd1e081
MD
96{
97 int ret = 0;
98
ffe60014
DG
99 assert(channel);
100 assert(ctx);
101
102 if (ctx->on_recv_channel != NULL) {
103 ret = ctx->on_recv_channel(channel);
104 if (ret == 0) {
d8ef542d 105 ret = consumer_add_channel(channel, ctx);
ffe60014
DG
106 } else if (ret < 0) {
107 /* Most likely an ENOMEM. */
108 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_OUTFD_ERROR);
109 goto error;
110 }
111 } else {
d8ef542d 112 ret = consumer_add_channel(channel, ctx);
3bd1e081
MD
113 }
114
d88aee68 115 DBG("UST consumer channel added (key: %" PRIu64 ")", channel->key);
ffe60014
DG
116
117error:
3bd1e081
MD
118 return ret;
119}
120
121/*
ffe60014
DG
122 * Allocate and return a consumer channel object.
123 */
124static struct lttng_consumer_channel *allocate_channel(uint64_t session_id,
125 const char *pathname, const char *name, uid_t uid, gid_t gid,
da009f2c 126 uint64_t relayd_id, uint64_t key, enum lttng_event_output output,
2bba9e53 127 uint64_t tracefile_size, uint64_t tracefile_count,
ecc48a90 128 uint64_t session_id_per_pid, unsigned int monitor,
d7ba1388 129 unsigned int live_timer_interval,
3d071855 130 const char *root_shm_path, const char *shm_path)
ffe60014
DG
131{
132 assert(pathname);
133 assert(name);
134
1950109e
JD
135 return consumer_allocate_channel(key, session_id, pathname, name, uid,
136 gid, relayd_id, output, tracefile_size,
d7ba1388 137 tracefile_count, session_id_per_pid, monitor,
3d071855 138 live_timer_interval, root_shm_path, shm_path);
ffe60014
DG
139}
140
141/*
142 * Allocate and return a consumer stream object. If _alloc_ret is not NULL, the
143 * error value if applicable is set in it else it is kept untouched.
3bd1e081 144 *
ffe60014 145 * Return NULL on error else the newly allocated stream object.
3bd1e081 146 */
ffe60014
DG
147static struct lttng_consumer_stream *allocate_stream(int cpu, int key,
148 struct lttng_consumer_channel *channel,
149 struct lttng_consumer_local_data *ctx, int *_alloc_ret)
150{
151 int alloc_ret;
152 struct lttng_consumer_stream *stream = NULL;
153
154 assert(channel);
155 assert(ctx);
156
157 stream = consumer_allocate_stream(channel->key,
158 key,
159 LTTNG_CONSUMER_ACTIVE_STREAM,
160 channel->name,
161 channel->uid,
162 channel->gid,
163 channel->relayd_id,
164 channel->session_id,
165 cpu,
166 &alloc_ret,
4891ece8
DG
167 channel->type,
168 channel->monitor);
ffe60014
DG
169 if (stream == NULL) {
170 switch (alloc_ret) {
171 case -ENOENT:
172 /*
173 * We could not find the channel. Can happen if cpu hotplug
174 * happens while tearing down.
175 */
176 DBG3("Could not find channel");
177 break;
178 case -ENOMEM:
179 case -EINVAL:
180 default:
181 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_OUTFD_ERROR);
182 break;
183 }
184 goto error;
185 }
186
187 stream->chan = channel;
188
189error:
190 if (_alloc_ret) {
191 *_alloc_ret = alloc_ret;
192 }
193 return stream;
194}
195
196/*
197 * Send the given stream pointer to the corresponding thread.
198 *
199 * Returns 0 on success else a negative value.
200 */
201static int send_stream_to_thread(struct lttng_consumer_stream *stream,
202 struct lttng_consumer_local_data *ctx)
203{
dae10966
DG
204 int ret;
205 struct lttng_pipe *stream_pipe;
ffe60014
DG
206
207 /* Get the right pipe where the stream will be sent. */
208 if (stream->metadata_flag) {
5ab66908
MD
209 ret = consumer_add_metadata_stream(stream);
210 if (ret) {
211 ERR("Consumer add metadata stream %" PRIu64 " failed.",
212 stream->key);
213 goto error;
214 }
dae10966 215 stream_pipe = ctx->consumer_metadata_pipe;
ffe60014 216 } else {
5ab66908
MD
217 ret = consumer_add_data_stream(stream);
218 if (ret) {
219 ERR("Consumer add stream %" PRIu64 " failed.",
220 stream->key);
221 goto error;
222 }
dae10966 223 stream_pipe = ctx->consumer_data_pipe;
ffe60014
DG
224 }
225
5ab66908
MD
226 /*
227 * From this point on, the stream's ownership has been moved away from
228 * the channel and becomes globally visible.
229 */
230 stream->globally_visible = 1;
231
dae10966 232 ret = lttng_pipe_write(stream_pipe, &stream, sizeof(stream));
ffe60014 233 if (ret < 0) {
dae10966
DG
234 ERR("Consumer write %s stream to pipe %d",
235 stream->metadata_flag ? "metadata" : "data",
236 lttng_pipe_get_writefd(stream_pipe));
5ab66908
MD
237 if (stream->metadata_flag) {
238 consumer_del_stream_for_metadata(stream);
239 } else {
240 consumer_del_stream_for_data(stream);
241 }
ffe60014 242 }
5ab66908 243error:
ffe60014
DG
244 return ret;
245}
246
4628484a
MD
247static
248int get_stream_shm_path(char *stream_shm_path, const char *shm_path, int cpu)
249{
45863397 250 char cpu_nr[INT_MAX_STR_LEN]; /* int max len */
4628484a
MD
251 int ret;
252
253 strncpy(stream_shm_path, shm_path, PATH_MAX);
254 stream_shm_path[PATH_MAX - 1] = '\0';
45863397 255 ret = snprintf(cpu_nr, INT_MAX_STR_LEN, "%i", cpu);
67f8cb8d
MD
256 if (ret < 0) {
257 PERROR("snprintf");
4628484a
MD
258 goto end;
259 }
260 strncat(stream_shm_path, cpu_nr,
261 PATH_MAX - strlen(stream_shm_path) - 1);
262 ret = 0;
263end:
264 return ret;
265}
266
d88aee68
DG
267/*
268 * Create streams for the given channel using liblttng-ust-ctl.
269 *
270 * Return 0 on success else a negative value.
271 */
ffe60014
DG
272static int create_ust_streams(struct lttng_consumer_channel *channel,
273 struct lttng_consumer_local_data *ctx)
274{
275 int ret, cpu = 0;
276 struct ustctl_consumer_stream *ustream;
277 struct lttng_consumer_stream *stream;
278
279 assert(channel);
280 assert(ctx);
281
282 /*
283 * While a stream is available from ustctl. When NULL is returned, we've
284 * reached the end of the possible stream for the channel.
285 */
286 while ((ustream = ustctl_create_stream(channel->uchan, cpu))) {
287 int wait_fd;
04ef1097 288 int ust_metadata_pipe[2];
ffe60014 289
9ce5646a
MD
290 health_code_update();
291
04ef1097
MD
292 if (channel->type == CONSUMER_CHANNEL_TYPE_METADATA && channel->monitor) {
293 ret = utils_create_pipe_cloexec_nonblock(ust_metadata_pipe);
294 if (ret < 0) {
295 ERR("Create ust metadata poll pipe");
296 goto error;
297 }
298 wait_fd = ust_metadata_pipe[0];
299 } else {
300 wait_fd = ustctl_stream_get_wait_fd(ustream);
301 }
ffe60014
DG
302
303 /* Allocate consumer stream object. */
304 stream = allocate_stream(cpu, wait_fd, channel, ctx, &ret);
305 if (!stream) {
306 goto error_alloc;
307 }
308 stream->ustream = ustream;
309 /*
310 * Store it so we can save multiple function calls afterwards since
311 * this value is used heavily in the stream threads. This is UST
312 * specific so this is why it's done after allocation.
313 */
314 stream->wait_fd = wait_fd;
315
b31398bb
DG
316 /*
317 * Increment channel refcount since the channel reference has now been
318 * assigned in the allocation process above.
319 */
10a50311
JD
320 if (stream->chan->monitor) {
321 uatomic_inc(&stream->chan->refcount);
322 }
b31398bb 323
ffe60014
DG
324 /*
325 * Order is important this is why a list is used. On error, the caller
326 * should clean this list.
327 */
328 cds_list_add_tail(&stream->send_node, &channel->streams.head);
329
330 ret = ustctl_get_max_subbuf_size(stream->ustream,
331 &stream->max_sb_size);
332 if (ret < 0) {
333 ERR("ustctl_get_max_subbuf_size failed for stream %s",
334 stream->name);
335 goto error;
336 }
337
338 /* Do actions once stream has been received. */
339 if (ctx->on_recv_stream) {
340 ret = ctx->on_recv_stream(stream);
341 if (ret < 0) {
342 goto error;
343 }
344 }
345
d88aee68 346 DBG("UST consumer add stream %s (key: %" PRIu64 ") with relayd id %" PRIu64,
ffe60014
DG
347 stream->name, stream->key, stream->relayd_stream_id);
348
349 /* Set next CPU stream. */
350 channel->streams.count = ++cpu;
d88aee68
DG
351
352 /* Keep stream reference when creating metadata. */
353 if (channel->type == CONSUMER_CHANNEL_TYPE_METADATA) {
354 channel->metadata_stream = stream;
8de4f941
JG
355 if (channel->monitor) {
356 /* Set metadata poll pipe if we created one */
357 memcpy(stream->ust_metadata_poll_pipe,
358 ust_metadata_pipe,
359 sizeof(ust_metadata_pipe));
360 }
d88aee68 361 }
ffe60014
DG
362 }
363
364 return 0;
365
366error:
367error_alloc:
368 return ret;
369}
370
4628484a
MD
371/*
372 * create_posix_shm is never called concurrently within a process.
373 */
374static
375int create_posix_shm(void)
376{
377 char tmp_name[NAME_MAX];
378 int shmfd, ret;
379
380 ret = snprintf(tmp_name, NAME_MAX, "/ust-shm-consumer-%d", getpid());
381 if (ret < 0) {
382 PERROR("snprintf");
383 return -1;
384 }
385 /*
386 * Allocate shm, and immediately unlink its shm oject, keeping
387 * only the file descriptor as a reference to the object.
388 * We specifically do _not_ use the / at the beginning of the
389 * pathname so that some OS implementations can keep it local to
390 * the process (POSIX leaves this implementation-defined).
391 */
392 shmfd = shm_open(tmp_name, O_CREAT | O_EXCL | O_RDWR, 0700);
393 if (shmfd < 0) {
394 PERROR("shm_open");
395 goto error_shm_open;
396 }
397 ret = shm_unlink(tmp_name);
398 if (ret < 0 && errno != ENOENT) {
399 PERROR("shm_unlink");
400 goto error_shm_release;
401 }
402 return shmfd;
403
404error_shm_release:
405 ret = close(shmfd);
406 if (ret) {
407 PERROR("close");
408 }
409error_shm_open:
410 return -1;
411}
412
413static int open_ust_stream_fd(struct lttng_consumer_channel *channel,
414 struct ustctl_consumer_channel_attr *attr,
415 int cpu)
416{
417 char shm_path[PATH_MAX];
418 int ret;
419
420 if (!channel->shm_path[0]) {
421 return create_posix_shm();
422 }
423 ret = get_stream_shm_path(shm_path, channel->shm_path, cpu);
424 if (ret) {
425 goto error_shm_path;
426 }
427 return run_as_open(shm_path,
428 O_RDWR | O_CREAT | O_EXCL, S_IRUSR | S_IWUSR,
429 channel->uid, channel->gid);
430
431error_shm_path:
432 return -1;
433}
434
ffe60014
DG
435/*
436 * Create an UST channel with the given attributes and send it to the session
437 * daemon using the ust ctl API.
438 *
439 * Return 0 on success or else a negative value.
440 */
4628484a
MD
441static int create_ust_channel(struct lttng_consumer_channel *channel,
442 struct ustctl_consumer_channel_attr *attr,
443 struct ustctl_consumer_channel **ust_chanp)
ffe60014 444{
4628484a
MD
445 int ret, nr_stream_fds, i, j;
446 int *stream_fds;
447 struct ustctl_consumer_channel *ust_channel;
ffe60014 448
4628484a 449 assert(channel);
ffe60014 450 assert(attr);
4628484a 451 assert(ust_chanp);
ffe60014
DG
452
453 DBG3("Creating channel to ustctl with attr: [overwrite: %d, "
454 "subbuf_size: %" PRIu64 ", num_subbuf: %" PRIu64 ", "
455 "switch_timer_interval: %u, read_timer_interval: %u, "
456 "output: %d, type: %d", attr->overwrite, attr->subbuf_size,
457 attr->num_subbuf, attr->switch_timer_interval,
458 attr->read_timer_interval, attr->output, attr->type);
459
4628484a
MD
460 if (channel->type == CONSUMER_CHANNEL_TYPE_METADATA)
461 nr_stream_fds = 1;
462 else
463 nr_stream_fds = ustctl_get_nr_stream_per_channel();
464 stream_fds = zmalloc(nr_stream_fds * sizeof(*stream_fds));
465 if (!stream_fds) {
466 ret = -1;
467 goto error_alloc;
468 }
469 for (i = 0; i < nr_stream_fds; i++) {
470 stream_fds[i] = open_ust_stream_fd(channel, attr, i);
471 if (stream_fds[i] < 0) {
472 ret = -1;
473 goto error_open;
474 }
475 }
476 ust_channel = ustctl_create_channel(attr, stream_fds, nr_stream_fds);
477 if (!ust_channel) {
ffe60014
DG
478 ret = -1;
479 goto error_create;
480 }
4628484a
MD
481 channel->nr_stream_fds = nr_stream_fds;
482 channel->stream_fds = stream_fds;
483 *ust_chanp = ust_channel;
ffe60014
DG
484
485 return 0;
486
487error_create:
4628484a
MD
488error_open:
489 for (j = i - 1; j >= 0; j--) {
490 int closeret;
491
492 closeret = close(stream_fds[j]);
493 if (closeret) {
494 PERROR("close");
495 }
496 if (channel->shm_path[0]) {
497 char shm_path[PATH_MAX];
498
499 closeret = get_stream_shm_path(shm_path,
500 channel->shm_path, j);
501 if (closeret) {
502 ERR("Cannot get stream shm path");
503 }
504 closeret = run_as_unlink(shm_path,
505 channel->uid, channel->gid);
506 if (closeret) {
4628484a
MD
507 PERROR("unlink %s", shm_path);
508 }
509 }
510 }
511 /* Try to rmdir all directories under shm_path root. */
512 if (channel->root_shm_path[0]) {
602766ec 513 (void) run_as_rmdir_recursive(channel->root_shm_path,
4628484a
MD
514 channel->uid, channel->gid);
515 }
516 free(stream_fds);
517error_alloc:
ffe60014
DG
518 return ret;
519}
520
d88aee68
DG
521/*
522 * Send a single given stream to the session daemon using the sock.
523 *
524 * Return 0 on success else a negative value.
525 */
ffe60014
DG
526static int send_sessiond_stream(int sock, struct lttng_consumer_stream *stream)
527{
528 int ret;
529
530 assert(stream);
531 assert(sock >= 0);
532
3eb914c0 533 DBG("UST consumer sending stream %" PRIu64 " to sessiond", stream->key);
ffe60014
DG
534
535 /* Send stream to session daemon. */
536 ret = ustctl_send_stream_to_sessiond(sock, stream->ustream);
537 if (ret < 0) {
538 goto error;
539 }
540
ffe60014
DG
541error:
542 return ret;
543}
544
545/*
546 * Send channel to sessiond.
547 *
d88aee68 548 * Return 0 on success or else a negative value.
ffe60014
DG
549 */
550static int send_sessiond_channel(int sock,
551 struct lttng_consumer_channel *channel,
552 struct lttng_consumer_local_data *ctx, int *relayd_error)
553{
0c759fc9 554 int ret, ret_code = LTTCOMM_CONSUMERD_SUCCESS;
ffe60014 555 struct lttng_consumer_stream *stream;
a4baae1b 556 uint64_t net_seq_idx = -1ULL;
ffe60014
DG
557
558 assert(channel);
559 assert(ctx);
560 assert(sock >= 0);
561
562 DBG("UST consumer sending channel %s to sessiond", channel->name);
563
62285ea4
DG
564 if (channel->relayd_id != (uint64_t) -1ULL) {
565 cds_list_for_each_entry(stream, &channel->streams.head, send_node) {
9ce5646a
MD
566
567 health_code_update();
568
62285ea4
DG
569 /* Try to send the stream to the relayd if one is available. */
570 ret = consumer_send_relayd_stream(stream, stream->chan->pathname);
571 if (ret < 0) {
572 /*
573 * Flag that the relayd was the problem here probably due to a
574 * communicaton error on the socket.
575 */
576 if (relayd_error) {
577 *relayd_error = 1;
578 }
725d28b2 579 ret_code = LTTCOMM_CONSUMERD_RELAYD_FAIL;
ffe60014 580 }
a4baae1b
JD
581 if (net_seq_idx == -1ULL) {
582 net_seq_idx = stream->net_seq_idx;
583 }
584 }
f2a444f1 585 }
ffe60014 586
f2a444f1
DG
587 /* Inform sessiond that we are about to send channel and streams. */
588 ret = consumer_send_status_msg(sock, ret_code);
0c759fc9 589 if (ret < 0 || ret_code != LTTCOMM_CONSUMERD_SUCCESS) {
f2a444f1
DG
590 /*
591 * Either the session daemon is not responding or the relayd died so we
592 * stop now.
593 */
594 goto error;
595 }
596
597 /* Send channel to sessiond. */
598 ret = ustctl_send_channel_to_sessiond(sock, channel->uchan);
599 if (ret < 0) {
600 goto error;
601 }
602
603 ret = ustctl_channel_close_wakeup_fd(channel->uchan);
604 if (ret < 0) {
605 goto error;
606 }
607
608 /* The channel was sent successfully to the sessiond at this point. */
609 cds_list_for_each_entry(stream, &channel->streams.head, send_node) {
9ce5646a
MD
610
611 health_code_update();
612
ffe60014
DG
613 /* Send stream to session daemon. */
614 ret = send_sessiond_stream(sock, stream);
615 if (ret < 0) {
616 goto error;
617 }
618 }
619
620 /* Tell sessiond there is no more stream. */
621 ret = ustctl_send_stream_to_sessiond(sock, NULL);
622 if (ret < 0) {
623 goto error;
624 }
625
626 DBG("UST consumer NULL stream sent to sessiond");
627
628 return 0;
629
630error:
0c759fc9 631 if (ret_code != LTTCOMM_CONSUMERD_SUCCESS) {
f2a444f1
DG
632 ret = -1;
633 }
ffe60014
DG
634 return ret;
635}
636
637/*
638 * Creates a channel and streams and add the channel it to the channel internal
639 * state. The created stream must ONLY be sent once the GET_CHANNEL command is
640 * received.
641 *
642 * Return 0 on success or else, a negative value is returned and the channel
643 * MUST be destroyed by consumer_del_channel().
644 */
645static int ask_channel(struct lttng_consumer_local_data *ctx, int sock,
646 struct lttng_consumer_channel *channel,
647 struct ustctl_consumer_channel_attr *attr)
3bd1e081
MD
648{
649 int ret;
650
ffe60014
DG
651 assert(ctx);
652 assert(channel);
653 assert(attr);
654
655 /*
656 * This value is still used by the kernel consumer since for the kernel,
657 * the stream ownership is not IN the consumer so we need to have the
658 * number of left stream that needs to be initialized so we can know when
659 * to delete the channel (see consumer.c).
660 *
661 * As for the user space tracer now, the consumer creates and sends the
662 * stream to the session daemon which only sends them to the application
663 * once every stream of a channel is received making this value useless
664 * because we they will be added to the poll thread before the application
665 * receives them. This ensures that a stream can not hang up during
666 * initilization of a channel.
667 */
668 channel->nb_init_stream_left = 0;
669
670 /* The reply msg status is handled in the following call. */
4628484a 671 ret = create_ust_channel(channel, attr, &channel->uchan);
ffe60014 672 if (ret < 0) {
10a50311 673 goto end;
3bd1e081
MD
674 }
675
d8ef542d
MD
676 channel->wait_fd = ustctl_channel_get_wait_fd(channel->uchan);
677
10a50311
JD
678 /*
679 * For the snapshots (no monitor), we create the metadata streams
680 * on demand, not during the channel creation.
681 */
682 if (channel->type == CONSUMER_CHANNEL_TYPE_METADATA && !channel->monitor) {
683 ret = 0;
684 goto end;
685 }
686
ffe60014
DG
687 /* Open all streams for this channel. */
688 ret = create_ust_streams(channel, ctx);
689 if (ret < 0) {
10a50311 690 goto end;
ffe60014
DG
691 }
692
10a50311 693end:
3bd1e081
MD
694 return ret;
695}
696
d88aee68
DG
697/*
698 * Send all stream of a channel to the right thread handling it.
699 *
700 * On error, return a negative value else 0 on success.
701 */
702static int send_streams_to_thread(struct lttng_consumer_channel *channel,
703 struct lttng_consumer_local_data *ctx)
704{
705 int ret = 0;
706 struct lttng_consumer_stream *stream, *stmp;
707
708 assert(channel);
709 assert(ctx);
710
711 /* Send streams to the corresponding thread. */
712 cds_list_for_each_entry_safe(stream, stmp, &channel->streams.head,
713 send_node) {
9ce5646a
MD
714
715 health_code_update();
716
d88aee68
DG
717 /* Sending the stream to the thread. */
718 ret = send_stream_to_thread(stream, ctx);
719 if (ret < 0) {
720 /*
721 * If we are unable to send the stream to the thread, there is
722 * a big problem so just stop everything.
723 */
5ab66908
MD
724 /* Remove node from the channel stream list. */
725 cds_list_del(&stream->send_node);
d88aee68
DG
726 goto error;
727 }
728
729 /* Remove node from the channel stream list. */
730 cds_list_del(&stream->send_node);
4891ece8 731
d88aee68
DG
732 }
733
734error:
735 return ret;
736}
737
7972aab2
DG
738/*
739 * Flush channel's streams using the given key to retrieve the channel.
740 *
741 * Return 0 on success else an LTTng error code.
742 */
743static int flush_channel(uint64_t chan_key)
744{
745 int ret = 0;
746 struct lttng_consumer_channel *channel;
747 struct lttng_consumer_stream *stream;
748 struct lttng_ht *ht;
749 struct lttng_ht_iter iter;
750
8fd623e0 751 DBG("UST consumer flush channel key %" PRIu64, chan_key);
7972aab2 752
a500c257 753 rcu_read_lock();
7972aab2
DG
754 channel = consumer_find_channel(chan_key);
755 if (!channel) {
8fd623e0 756 ERR("UST consumer flush channel %" PRIu64 " not found", chan_key);
7972aab2
DG
757 ret = LTTNG_ERR_UST_CHAN_NOT_FOUND;
758 goto error;
759 }
760
761 ht = consumer_data.stream_per_chan_id_ht;
762
763 /* For each stream of the channel id, flush it. */
7972aab2
DG
764 cds_lfht_for_each_entry_duplicate(ht->ht,
765 ht->hash_fct(&channel->key, lttng_ht_seed), ht->match_fct,
766 &channel->key, &iter.iter, stream, node_channel_id.node) {
9ce5646a
MD
767
768 health_code_update();
769
0dd01979
MD
770 pthread_mutex_lock(&stream->lock);
771 if (!stream->quiescent) {
772 ustctl_flush_buffer(stream->ustream, 0);
773 stream->quiescent = true;
774 }
775 pthread_mutex_unlock(&stream->lock);
776 }
777error:
778 rcu_read_unlock();
779 return ret;
780}
781
782/*
783 * Clear quiescent state from channel's streams using the given key to
784 * retrieve the channel.
785 *
786 * Return 0 on success else an LTTng error code.
787 */
788static int clear_quiescent_channel(uint64_t chan_key)
789{
790 int ret = 0;
791 struct lttng_consumer_channel *channel;
792 struct lttng_consumer_stream *stream;
793 struct lttng_ht *ht;
794 struct lttng_ht_iter iter;
795
796 DBG("UST consumer clear quiescent channel key %" PRIu64, chan_key);
797
798 rcu_read_lock();
799 channel = consumer_find_channel(chan_key);
800 if (!channel) {
801 ERR("UST consumer clear quiescent channel %" PRIu64 " not found", chan_key);
802 ret = LTTNG_ERR_UST_CHAN_NOT_FOUND;
803 goto error;
804 }
805
806 ht = consumer_data.stream_per_chan_id_ht;
807
808 /* For each stream of the channel id, clear quiescent state. */
809 cds_lfht_for_each_entry_duplicate(ht->ht,
810 ht->hash_fct(&channel->key, lttng_ht_seed), ht->match_fct,
811 &channel->key, &iter.iter, stream, node_channel_id.node) {
812
813 health_code_update();
814
815 pthread_mutex_lock(&stream->lock);
816 stream->quiescent = false;
817 pthread_mutex_unlock(&stream->lock);
7972aab2 818 }
7972aab2 819error:
a500c257 820 rcu_read_unlock();
7972aab2
DG
821 return ret;
822}
823
d88aee68
DG
824/*
825 * Close metadata stream wakeup_fd using the given key to retrieve the channel.
a500c257 826 * RCU read side lock MUST be acquired before calling this function.
d88aee68
DG
827 *
828 * Return 0 on success else an LTTng error code.
829 */
830static int close_metadata(uint64_t chan_key)
831{
ea88ca2a 832 int ret = 0;
d88aee68 833 struct lttng_consumer_channel *channel;
85aa60d7 834 unsigned int channel_monitor;
d88aee68 835
8fd623e0 836 DBG("UST consumer close metadata key %" PRIu64, chan_key);
d88aee68
DG
837
838 channel = consumer_find_channel(chan_key);
839 if (!channel) {
84cc9aa0
DG
840 /*
841 * This is possible if the metadata thread has issue a delete because
842 * the endpoint point of the stream hung up. There is no way the
843 * session daemon can know about it thus use a DBG instead of an actual
844 * error.
845 */
846 DBG("UST consumer close metadata %" PRIu64 " not found", chan_key);
d88aee68
DG
847 ret = LTTNG_ERR_UST_CHAN_NOT_FOUND;
848 goto error;
849 }
850
ea88ca2a 851 pthread_mutex_lock(&consumer_data.lock);
a9838785 852 pthread_mutex_lock(&channel->lock);
85aa60d7 853 channel_monitor = channel->monitor;
73811ecc
DG
854 if (cds_lfht_is_node_deleted(&channel->node.node)) {
855 goto error_unlock;
856 }
857
6d574024 858 lttng_ustconsumer_close_metadata(channel);
85aa60d7
JG
859 pthread_mutex_unlock(&channel->lock);
860 pthread_mutex_unlock(&consumer_data.lock);
d88aee68 861
85aa60d7
JG
862 /*
863 * The ownership of a metadata channel depends on the type of
864 * session to which it belongs. In effect, the monitor flag is checked
865 * to determine if this metadata channel is in "snapshot" mode or not.
866 *
867 * In the non-snapshot case, the metadata channel is created along with
868 * a single stream which will remain present until the metadata channel
869 * is destroyed (on the destruction of its session). In this case, the
870 * metadata stream in "monitored" by the metadata poll thread and holds
871 * the ownership of its channel.
872 *
873 * Closing the metadata will cause the metadata stream's "metadata poll
874 * pipe" to be closed. Closing this pipe will wake-up the metadata poll
875 * thread which will teardown the metadata stream which, in return,
876 * deletes the metadata channel.
877 *
878 * In the snapshot case, the metadata stream is created and destroyed
879 * on every snapshot record. Since the channel doesn't have an owner
880 * other than the session daemon, it is safe to destroy it immediately
881 * on reception of the CLOSE_METADATA command.
882 */
883 if (!channel_monitor) {
884 /*
885 * The channel and consumer_data locks must be
886 * released before this call since consumer_del_channel
887 * re-acquires the channel and consumer_data locks to teardown
888 * the channel and queue its reclamation by the "call_rcu"
889 * worker thread.
890 */
891 consumer_del_channel(channel);
892 }
893
894 return ret;
ea88ca2a 895error_unlock:
a9838785 896 pthread_mutex_unlock(&channel->lock);
ea88ca2a 897 pthread_mutex_unlock(&consumer_data.lock);
d88aee68
DG
898error:
899 return ret;
900}
901
902/*
903 * RCU read side lock MUST be acquired before calling this function.
904 *
905 * Return 0 on success else an LTTng error code.
906 */
907static int setup_metadata(struct lttng_consumer_local_data *ctx, uint64_t key)
908{
909 int ret;
910 struct lttng_consumer_channel *metadata;
911
8fd623e0 912 DBG("UST consumer setup metadata key %" PRIu64, key);
d88aee68
DG
913
914 metadata = consumer_find_channel(key);
915 if (!metadata) {
916 ERR("UST consumer push metadata %" PRIu64 " not found", key);
917 ret = LTTNG_ERR_UST_CHAN_NOT_FOUND;
10a50311
JD
918 goto end;
919 }
920
921 /*
922 * In no monitor mode, the metadata channel has no stream(s) so skip the
923 * ownership transfer to the metadata thread.
924 */
925 if (!metadata->monitor) {
926 DBG("Metadata channel in no monitor");
927 ret = 0;
928 goto end;
d88aee68
DG
929 }
930
931 /*
932 * Send metadata stream to relayd if one available. Availability is
933 * known if the stream is still in the list of the channel.
934 */
935 if (cds_list_empty(&metadata->streams.head)) {
936 ERR("Metadata channel key %" PRIu64 ", no stream available.", key);
937 ret = LTTCOMM_CONSUMERD_ERROR_METADATA;
f5a0c9cf 938 goto error_no_stream;
d88aee68
DG
939 }
940
941 /* Send metadata stream to relayd if needed. */
62285ea4
DG
942 if (metadata->metadata_stream->net_seq_idx != (uint64_t) -1ULL) {
943 ret = consumer_send_relayd_stream(metadata->metadata_stream,
944 metadata->pathname);
945 if (ret < 0) {
946 ret = LTTCOMM_CONSUMERD_ERROR_METADATA;
947 goto error;
948 }
601262d6
JD
949 ret = consumer_send_relayd_streams_sent(
950 metadata->metadata_stream->net_seq_idx);
951 if (ret < 0) {
952 ret = LTTCOMM_CONSUMERD_RELAYD_FAIL;
953 goto error;
954 }
d88aee68
DG
955 }
956
957 ret = send_streams_to_thread(metadata, ctx);
958 if (ret < 0) {
959 /*
960 * If we are unable to send the stream to the thread, there is
961 * a big problem so just stop everything.
962 */
963 ret = LTTCOMM_CONSUMERD_FATAL;
964 goto error;
965 }
966 /* List MUST be empty after or else it could be reused. */
967 assert(cds_list_empty(&metadata->streams.head));
968
10a50311
JD
969 ret = 0;
970 goto end;
d88aee68
DG
971
972error:
f2a444f1
DG
973 /*
974 * Delete metadata channel on error. At this point, the metadata stream can
975 * NOT be monitored by the metadata thread thus having the guarantee that
976 * the stream is still in the local stream list of the channel. This call
977 * will make sure to clean that list.
978 */
f5a0c9cf 979 consumer_stream_destroy(metadata->metadata_stream, NULL);
212d67a2
DG
980 cds_list_del(&metadata->metadata_stream->send_node);
981 metadata->metadata_stream = NULL;
f5a0c9cf 982error_no_stream:
10a50311
JD
983end:
984 return ret;
985}
986
987/*
988 * Snapshot the whole metadata.
989 *
990 * Returns 0 on success, < 0 on error
991 */
992static int snapshot_metadata(uint64_t key, char *path, uint64_t relayd_id,
993 struct lttng_consumer_local_data *ctx)
994{
995 int ret = 0;
10a50311
JD
996 struct lttng_consumer_channel *metadata_channel;
997 struct lttng_consumer_stream *metadata_stream;
998
999 assert(path);
1000 assert(ctx);
1001
1002 DBG("UST consumer snapshot metadata with key %" PRIu64 " at path %s",
1003 key, path);
1004
1005 rcu_read_lock();
1006
1007 metadata_channel = consumer_find_channel(key);
1008 if (!metadata_channel) {
6a00837f
MD
1009 ERR("UST snapshot metadata channel not found for key %" PRIu64,
1010 key);
10a50311
JD
1011 ret = -1;
1012 goto error;
1013 }
1014 assert(!metadata_channel->monitor);
1015
9ce5646a
MD
1016 health_code_update();
1017
10a50311
JD
1018 /*
1019 * Ask the sessiond if we have new metadata waiting and update the
1020 * consumer metadata cache.
1021 */
94d49140 1022 ret = lttng_ustconsumer_request_metadata(ctx, metadata_channel, 0, 1);
10a50311
JD
1023 if (ret < 0) {
1024 goto error;
1025 }
1026
9ce5646a
MD
1027 health_code_update();
1028
10a50311
JD
1029 /*
1030 * The metadata stream is NOT created in no monitor mode when the channel
1031 * is created on a sessiond ask channel command.
1032 */
1033 ret = create_ust_streams(metadata_channel, ctx);
1034 if (ret < 0) {
1035 goto error;
1036 }
1037
1038 metadata_stream = metadata_channel->metadata_stream;
1039 assert(metadata_stream);
1040
1041 if (relayd_id != (uint64_t) -1ULL) {
1042 metadata_stream->net_seq_idx = relayd_id;
1043 ret = consumer_send_relayd_stream(metadata_stream, path);
1044 if (ret < 0) {
1045 goto error_stream;
1046 }
1047 } else {
1048 ret = utils_create_stream_file(path, metadata_stream->name,
1049 metadata_stream->chan->tracefile_size,
1050 metadata_stream->tracefile_count_current,
309167d2 1051 metadata_stream->uid, metadata_stream->gid, NULL);
10a50311
JD
1052 if (ret < 0) {
1053 goto error_stream;
1054 }
1055 metadata_stream->out_fd = ret;
1056 metadata_stream->tracefile_size_current = 0;
1057 }
1058
04ef1097 1059 do {
9ce5646a
MD
1060 health_code_update();
1061
10a50311
JD
1062 ret = lttng_consumer_read_subbuffer(metadata_stream, ctx);
1063 if (ret < 0) {
94d49140 1064 goto error_stream;
10a50311 1065 }
04ef1097 1066 } while (ret > 0);
10a50311 1067
10a50311
JD
1068error_stream:
1069 /*
1070 * Clean up the stream completly because the next snapshot will use a new
1071 * metadata stream.
1072 */
10a50311 1073 consumer_stream_destroy(metadata_stream, NULL);
212d67a2 1074 cds_list_del(&metadata_stream->send_node);
10a50311
JD
1075 metadata_channel->metadata_stream = NULL;
1076
1077error:
1078 rcu_read_unlock();
1079 return ret;
1080}
1081
1082/*
1083 * Take a snapshot of all the stream of a channel.
1084 *
1085 * Returns 0 on success, < 0 on error
1086 */
1087static int snapshot_channel(uint64_t key, char *path, uint64_t relayd_id,
d07ceecd 1088 uint64_t nb_packets_per_stream, struct lttng_consumer_local_data *ctx)
10a50311
JD
1089{
1090 int ret;
1091 unsigned use_relayd = 0;
1092 unsigned long consumed_pos, produced_pos;
1093 struct lttng_consumer_channel *channel;
1094 struct lttng_consumer_stream *stream;
1095
1096 assert(path);
1097 assert(ctx);
1098
1099 rcu_read_lock();
1100
1101 if (relayd_id != (uint64_t) -1ULL) {
1102 use_relayd = 1;
1103 }
1104
1105 channel = consumer_find_channel(key);
1106 if (!channel) {
6a00837f 1107 ERR("UST snapshot channel not found for key %" PRIu64, key);
10a50311
JD
1108 ret = -1;
1109 goto error;
1110 }
1111 assert(!channel->monitor);
6a00837f 1112 DBG("UST consumer snapshot channel %" PRIu64, key);
10a50311
JD
1113
1114 cds_list_for_each_entry(stream, &channel->streams.head, send_node) {
9ce5646a
MD
1115 health_code_update();
1116
10a50311
JD
1117 /* Lock stream because we are about to change its state. */
1118 pthread_mutex_lock(&stream->lock);
1119 stream->net_seq_idx = relayd_id;
1120
1121 if (use_relayd) {
1122 ret = consumer_send_relayd_stream(stream, path);
1123 if (ret < 0) {
1124 goto error_unlock;
1125 }
1126 } else {
1127 ret = utils_create_stream_file(path, stream->name,
1128 stream->chan->tracefile_size,
1129 stream->tracefile_count_current,
309167d2 1130 stream->uid, stream->gid, NULL);
10a50311
JD
1131 if (ret < 0) {
1132 goto error_unlock;
1133 }
1134 stream->out_fd = ret;
1135 stream->tracefile_size_current = 0;
1136
1137 DBG("UST consumer snapshot stream %s/%s (%" PRIu64 ")", path,
1138 stream->name, stream->key);
1139 }
1140
d4d80f77
MD
1141 /*
1142 * If tracing is active, we want to perform a "full" buffer flush.
1143 * Else, if quiescent, it has already been done by the prior stop.
1144 */
1145 if (!stream->quiescent) {
1146 ustctl_flush_buffer(stream->ustream, 0);
1147 }
10a50311
JD
1148
1149 ret = lttng_ustconsumer_take_snapshot(stream);
1150 if (ret < 0) {
1151 ERR("Taking UST snapshot");
1152 goto error_unlock;
1153 }
1154
1155 ret = lttng_ustconsumer_get_produced_snapshot(stream, &produced_pos);
1156 if (ret < 0) {
1157 ERR("Produced UST snapshot position");
1158 goto error_unlock;
1159 }
1160
1161 ret = lttng_ustconsumer_get_consumed_snapshot(stream, &consumed_pos);
1162 if (ret < 0) {
1163 ERR("Consumerd UST snapshot position");
1164 goto error_unlock;
1165 }
1166
5c786ded
JD
1167 /*
1168 * The original value is sent back if max stream size is larger than
d07ceecd 1169 * the possible size of the snapshot. Also, we assume that the session
5c786ded
JD
1170 * daemon should never send a maximum stream size that is lower than
1171 * subbuffer size.
1172 */
d07ceecd
MD
1173 consumed_pos = consumer_get_consume_start_pos(consumed_pos,
1174 produced_pos, nb_packets_per_stream,
1175 stream->max_sb_size);
5c786ded 1176
10a50311
JD
1177 while (consumed_pos < produced_pos) {
1178 ssize_t read_len;
1179 unsigned long len, padded_len;
1180
9ce5646a
MD
1181 health_code_update();
1182
10a50311
JD
1183 DBG("UST consumer taking snapshot at pos %lu", consumed_pos);
1184
1185 ret = ustctl_get_subbuf(stream->ustream, &consumed_pos);
1186 if (ret < 0) {
1187 if (ret != -EAGAIN) {
1188 PERROR("ustctl_get_subbuf snapshot");
1189 goto error_close_stream;
1190 }
1191 DBG("UST consumer get subbuf failed. Skipping it.");
1192 consumed_pos += stream->max_sb_size;
2947da29 1193 stream->chan->lost_packets++;
10a50311
JD
1194 continue;
1195 }
1196
1197 ret = ustctl_get_subbuf_size(stream->ustream, &len);
1198 if (ret < 0) {
1199 ERR("Snapshot ustctl_get_subbuf_size");
1200 goto error_put_subbuf;
1201 }
1202
1203 ret = ustctl_get_padded_subbuf_size(stream->ustream, &padded_len);
1204 if (ret < 0) {
1205 ERR("Snapshot ustctl_get_padded_subbuf_size");
1206 goto error_put_subbuf;
1207 }
1208
1209 read_len = lttng_consumer_on_read_subbuffer_mmap(ctx, stream, len,
309167d2 1210 padded_len - len, NULL);
10a50311
JD
1211 if (use_relayd) {
1212 if (read_len != len) {
56591bac 1213 ret = -EPERM;
10a50311
JD
1214 goto error_put_subbuf;
1215 }
1216 } else {
1217 if (read_len != padded_len) {
56591bac 1218 ret = -EPERM;
10a50311
JD
1219 goto error_put_subbuf;
1220 }
1221 }
1222
1223 ret = ustctl_put_subbuf(stream->ustream);
1224 if (ret < 0) {
1225 ERR("Snapshot ustctl_put_subbuf");
1226 goto error_close_stream;
1227 }
1228 consumed_pos += stream->max_sb_size;
1229 }
1230
1231 /* Simply close the stream so we can use it on the next snapshot. */
1232 consumer_stream_close(stream);
1233 pthread_mutex_unlock(&stream->lock);
1234 }
1235
1236 rcu_read_unlock();
1237 return 0;
1238
1239error_put_subbuf:
1240 if (ustctl_put_subbuf(stream->ustream) < 0) {
1241 ERR("Snapshot ustctl_put_subbuf");
1242 }
1243error_close_stream:
1244 consumer_stream_close(stream);
1245error_unlock:
1246 pthread_mutex_unlock(&stream->lock);
1247error:
1248 rcu_read_unlock();
d88aee68
DG
1249 return ret;
1250}
1251
331744e3 1252/*
c585821b
MD
1253 * Receive the metadata updates from the sessiond. Supports receiving
1254 * overlapping metadata, but is needs to always belong to a contiguous
1255 * range starting from 0.
1256 * Be careful about the locks held when calling this function: it needs
1257 * the metadata cache flush to concurrently progress in order to
1258 * complete.
331744e3
JD
1259 */
1260int lttng_ustconsumer_recv_metadata(int sock, uint64_t key, uint64_t offset,
93ec662e
JD
1261 uint64_t len, uint64_t version,
1262 struct lttng_consumer_channel *channel, int timer, int wait)
331744e3 1263{
0c759fc9 1264 int ret, ret_code = LTTCOMM_CONSUMERD_SUCCESS;
331744e3
JD
1265 char *metadata_str;
1266
8fd623e0 1267 DBG("UST consumer push metadata key %" PRIu64 " of len %" PRIu64, key, len);
331744e3
JD
1268
1269 metadata_str = zmalloc(len * sizeof(char));
1270 if (!metadata_str) {
1271 PERROR("zmalloc metadata string");
1272 ret_code = LTTCOMM_CONSUMERD_ENOMEM;
1273 goto end;
1274 }
1275
9ce5646a
MD
1276 health_code_update();
1277
331744e3
JD
1278 /* Receive metadata string. */
1279 ret = lttcomm_recv_unix_sock(sock, metadata_str, len);
1280 if (ret < 0) {
1281 /* Session daemon is dead so return gracefully. */
1282 ret_code = ret;
1283 goto end_free;
1284 }
1285
9ce5646a
MD
1286 health_code_update();
1287
331744e3 1288 pthread_mutex_lock(&channel->metadata_cache->lock);
93ec662e
JD
1289 ret = consumer_metadata_cache_write(channel, offset, len, version,
1290 metadata_str);
331744e3
JD
1291 if (ret < 0) {
1292 /* Unable to handle metadata. Notify session daemon. */
1293 ret_code = LTTCOMM_CONSUMERD_ERROR_METADATA;
a32bd775
DG
1294 /*
1295 * Skip metadata flush on write error since the offset and len might
1296 * not have been updated which could create an infinite loop below when
1297 * waiting for the metadata cache to be flushed.
1298 */
1299 pthread_mutex_unlock(&channel->metadata_cache->lock);
a32bd775 1300 goto end_free;
331744e3
JD
1301 }
1302 pthread_mutex_unlock(&channel->metadata_cache->lock);
1303
94d49140
JD
1304 if (!wait) {
1305 goto end_free;
1306 }
5e41ebe1 1307 while (consumer_metadata_cache_flushed(channel, offset + len, timer)) {
331744e3 1308 DBG("Waiting for metadata to be flushed");
9ce5646a
MD
1309
1310 health_code_update();
1311
331744e3
JD
1312 usleep(DEFAULT_METADATA_AVAILABILITY_WAIT_TIME);
1313 }
1314
1315end_free:
1316 free(metadata_str);
1317end:
1318 return ret_code;
1319}
1320
4cbc1a04
DG
1321/*
1322 * Receive command from session daemon and process it.
1323 *
1324 * Return 1 on success else a negative value or 0.
1325 */
3bd1e081
MD
1326int lttng_ustconsumer_recv_cmd(struct lttng_consumer_local_data *ctx,
1327 int sock, struct pollfd *consumer_sockpoll)
1328{
1329 ssize_t ret;
0c759fc9 1330 enum lttcomm_return_code ret_code = LTTCOMM_CONSUMERD_SUCCESS;
3bd1e081 1331 struct lttcomm_consumer_msg msg;
ffe60014 1332 struct lttng_consumer_channel *channel = NULL;
3bd1e081 1333
9ce5646a
MD
1334 health_code_update();
1335
3bd1e081
MD
1336 ret = lttcomm_recv_unix_sock(sock, &msg, sizeof(msg));
1337 if (ret != sizeof(msg)) {
173af62f
DG
1338 DBG("Consumer received unexpected message size %zd (expects %zu)",
1339 ret, sizeof(msg));
3be74084
DG
1340 /*
1341 * The ret value might 0 meaning an orderly shutdown but this is ok
1342 * since the caller handles this.
1343 */
489f70e9 1344 if (ret > 0) {
c6857fcf 1345 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_ERROR_RECV_CMD);
489f70e9
MD
1346 ret = -1;
1347 }
3bd1e081
MD
1348 return ret;
1349 }
9ce5646a
MD
1350
1351 health_code_update();
1352
84382d49
MD
1353 /* deprecated */
1354 assert(msg.cmd_type != LTTNG_CONSUMER_STOP);
3bd1e081 1355
9ce5646a
MD
1356 health_code_update();
1357
3f8e211f 1358 /* relayd needs RCU read-side lock */
b0b335c8
MD
1359 rcu_read_lock();
1360
3bd1e081 1361 switch (msg.cmd_type) {
00e2e675
DG
1362 case LTTNG_CONSUMER_ADD_RELAYD_SOCKET:
1363 {
f50f23d9 1364 /* Session daemon status message are handled in the following call. */
3ab4ee7d 1365 consumer_add_relayd_socket(msg.u.relayd_sock.net_index,
7735ef9e 1366 msg.u.relayd_sock.type, ctx, sock, consumer_sockpoll,
d3e2ba59
JD
1367 &msg.u.relayd_sock.sock, msg.u.relayd_sock.session_id,
1368 msg.u.relayd_sock.relayd_session_id);
00e2e675
DG
1369 goto end_nosignal;
1370 }
173af62f
DG
1371 case LTTNG_CONSUMER_DESTROY_RELAYD:
1372 {
a6ba4fe1 1373 uint64_t index = msg.u.destroy_relayd.net_seq_idx;
173af62f
DG
1374 struct consumer_relayd_sock_pair *relayd;
1375
a6ba4fe1 1376 DBG("UST consumer destroying relayd %" PRIu64, index);
173af62f
DG
1377
1378 /* Get relayd reference if exists. */
a6ba4fe1 1379 relayd = consumer_find_relayd(index);
173af62f 1380 if (relayd == NULL) {
3448e266 1381 DBG("Unable to find relayd %" PRIu64, index);
e462382a 1382 ret_code = LTTCOMM_CONSUMERD_RELAYD_FAIL;
173af62f
DG
1383 }
1384
a6ba4fe1
DG
1385 /*
1386 * Each relayd socket pair has a refcount of stream attached to it
1387 * which tells if the relayd is still active or not depending on the
1388 * refcount value.
1389 *
1390 * This will set the destroy flag of the relayd object and destroy it
1391 * if the refcount reaches zero when called.
1392 *
1393 * The destroy can happen either here or when a stream fd hangs up.
1394 */
f50f23d9
DG
1395 if (relayd) {
1396 consumer_flag_relayd_for_destroy(relayd);
1397 }
1398
d88aee68 1399 goto end_msg_sessiond;
173af62f 1400 }
3bd1e081
MD
1401 case LTTNG_CONSUMER_UPDATE_STREAM:
1402 {
3f8e211f 1403 rcu_read_unlock();
7ad0a0cb 1404 return -ENOSYS;
3bd1e081 1405 }
6d805429 1406 case LTTNG_CONSUMER_DATA_PENDING:
53632229 1407 {
3be74084 1408 int ret, is_data_pending;
6d805429 1409 uint64_t id = msg.u.data_pending.session_id;
ca22feea 1410
6d805429 1411 DBG("UST consumer data pending command for id %" PRIu64, id);
ca22feea 1412
3be74084 1413 is_data_pending = consumer_data_pending(id);
ca22feea
DG
1414
1415 /* Send back returned value to session daemon */
3be74084
DG
1416 ret = lttcomm_send_unix_sock(sock, &is_data_pending,
1417 sizeof(is_data_pending));
ca22feea 1418 if (ret < 0) {
3be74084 1419 DBG("Error when sending the data pending ret code: %d", ret);
489f70e9 1420 goto error_fatal;
ca22feea 1421 }
f50f23d9
DG
1422
1423 /*
1424 * No need to send back a status message since the data pending
1425 * returned value is the response.
1426 */
ca22feea 1427 break;
53632229 1428 }
ffe60014
DG
1429 case LTTNG_CONSUMER_ASK_CHANNEL_CREATION:
1430 {
1431 int ret;
1432 struct ustctl_consumer_channel_attr attr;
1433
1434 /* Create a plain object and reserve a channel key. */
1435 channel = allocate_channel(msg.u.ask_channel.session_id,
1436 msg.u.ask_channel.pathname, msg.u.ask_channel.name,
1437 msg.u.ask_channel.uid, msg.u.ask_channel.gid,
1438 msg.u.ask_channel.relayd_id, msg.u.ask_channel.key,
1624d5b7
JD
1439 (enum lttng_event_output) msg.u.ask_channel.output,
1440 msg.u.ask_channel.tracefile_size,
2bba9e53 1441 msg.u.ask_channel.tracefile_count,
1950109e 1442 msg.u.ask_channel.session_id_per_pid,
ecc48a90 1443 msg.u.ask_channel.monitor,
d7ba1388 1444 msg.u.ask_channel.live_timer_interval,
3d071855 1445 msg.u.ask_channel.root_shm_path,
d7ba1388 1446 msg.u.ask_channel.shm_path);
ffe60014
DG
1447 if (!channel) {
1448 goto end_channel_error;
1449 }
1450
567eb353
DG
1451 /*
1452 * Assign UST application UID to the channel. This value is ignored for
1453 * per PID buffers. This is specific to UST thus setting this after the
1454 * allocation.
1455 */
1456 channel->ust_app_uid = msg.u.ask_channel.ust_app_uid;
1457
ffe60014
DG
1458 /* Build channel attributes from received message. */
1459 attr.subbuf_size = msg.u.ask_channel.subbuf_size;
1460 attr.num_subbuf = msg.u.ask_channel.num_subbuf;
1461 attr.overwrite = msg.u.ask_channel.overwrite;
1462 attr.switch_timer_interval = msg.u.ask_channel.switch_timer_interval;
1463 attr.read_timer_interval = msg.u.ask_channel.read_timer_interval;
7972aab2 1464 attr.chan_id = msg.u.ask_channel.chan_id;
ffe60014 1465 memcpy(attr.uuid, msg.u.ask_channel.uuid, sizeof(attr.uuid));
f515d318 1466 attr.blocking_timeout= msg.u.ask_channel.blocking_timeout;
ffe60014 1467
0c759fc9
DG
1468 /* Match channel buffer type to the UST abi. */
1469 switch (msg.u.ask_channel.output) {
1470 case LTTNG_EVENT_MMAP:
1471 default:
1472 attr.output = LTTNG_UST_MMAP;
1473 break;
1474 }
1475
ffe60014
DG
1476 /* Translate and save channel type. */
1477 switch (msg.u.ask_channel.type) {
1478 case LTTNG_UST_CHAN_PER_CPU:
1479 channel->type = CONSUMER_CHANNEL_TYPE_DATA;
1480 attr.type = LTTNG_UST_CHAN_PER_CPU;
8633d6e3
MD
1481 /*
1482 * Set refcount to 1 for owner. Below, we will
1483 * pass ownership to the
1484 * consumer_thread_channel_poll() thread.
1485 */
1486 channel->refcount = 1;
ffe60014
DG
1487 break;
1488 case LTTNG_UST_CHAN_METADATA:
1489 channel->type = CONSUMER_CHANNEL_TYPE_METADATA;
1490 attr.type = LTTNG_UST_CHAN_METADATA;
1491 break;
1492 default:
1493 assert(0);
1494 goto error_fatal;
1495 };
1496
9ce5646a
MD
1497 health_code_update();
1498
ffe60014
DG
1499 ret = ask_channel(ctx, sock, channel, &attr);
1500 if (ret < 0) {
1501 goto end_channel_error;
1502 }
1503
fc643247
MD
1504 if (msg.u.ask_channel.type == LTTNG_UST_CHAN_METADATA) {
1505 ret = consumer_metadata_cache_allocate(channel);
1506 if (ret < 0) {
1507 ERR("Allocating metadata cache");
1508 goto end_channel_error;
1509 }
1510 consumer_timer_switch_start(channel, attr.switch_timer_interval);
1511 attr.switch_timer_interval = 0;
94d49140 1512 } else {
e9404c27
JG
1513 int monitor_start_ret;
1514
94d49140
JD
1515 consumer_timer_live_start(channel,
1516 msg.u.ask_channel.live_timer_interval);
e9404c27
JG
1517 monitor_start_ret = consumer_timer_monitor_start(
1518 channel,
1519 msg.u.ask_channel.monitor_timer_interval);
1520 if (monitor_start_ret < 0) {
1521 ERR("Starting channel monitoring timer failed");
1522 goto end_channel_error;
1523 }
fc643247
MD
1524 }
1525
9ce5646a
MD
1526 health_code_update();
1527
ffe60014
DG
1528 /*
1529 * Add the channel to the internal state AFTER all streams were created
1530 * and successfully sent to session daemon. This way, all streams must
1531 * be ready before this channel is visible to the threads.
fc643247
MD
1532 * If add_channel succeeds, ownership of the channel is
1533 * passed to consumer_thread_channel_poll().
ffe60014
DG
1534 */
1535 ret = add_channel(channel, ctx);
1536 if (ret < 0) {
ea88ca2a
MD
1537 if (msg.u.ask_channel.type == LTTNG_UST_CHAN_METADATA) {
1538 if (channel->switch_timer_enabled == 1) {
1539 consumer_timer_switch_stop(channel);
1540 }
1541 consumer_metadata_cache_destroy(channel);
1542 }
d3e2ba59
JD
1543 if (channel->live_timer_enabled == 1) {
1544 consumer_timer_live_stop(channel);
1545 }
e9404c27
JG
1546 if (channel->monitor_timer_enabled == 1) {
1547 consumer_timer_monitor_stop(channel);
1548 }
ffe60014
DG
1549 goto end_channel_error;
1550 }
1551
9ce5646a
MD
1552 health_code_update();
1553
ffe60014
DG
1554 /*
1555 * Channel and streams are now created. Inform the session daemon that
1556 * everything went well and should wait to receive the channel and
1557 * streams with ustctl API.
1558 */
1559 ret = consumer_send_status_channel(sock, channel);
1560 if (ret < 0) {
1561 /*
489f70e9 1562 * There is probably a problem on the socket.
ffe60014 1563 */
489f70e9 1564 goto error_fatal;
ffe60014
DG
1565 }
1566
1567 break;
1568 }
1569 case LTTNG_CONSUMER_GET_CHANNEL:
1570 {
1571 int ret, relayd_err = 0;
d88aee68 1572 uint64_t key = msg.u.get_channel.key;
ffe60014 1573 struct lttng_consumer_channel *channel;
ffe60014
DG
1574
1575 channel = consumer_find_channel(key);
1576 if (!channel) {
8fd623e0 1577 ERR("UST consumer get channel key %" PRIu64 " not found", key);
e462382a 1578 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
ffe60014
DG
1579 goto end_msg_sessiond;
1580 }
1581
9ce5646a
MD
1582 health_code_update();
1583
ffe60014
DG
1584 /* Send everything to sessiond. */
1585 ret = send_sessiond_channel(sock, channel, ctx, &relayd_err);
1586 if (ret < 0) {
1587 if (relayd_err) {
1588 /*
1589 * We were unable to send to the relayd the stream so avoid
1590 * sending back a fatal error to the thread since this is OK
f2a444f1
DG
1591 * and the consumer can continue its work. The above call
1592 * has sent the error status message to the sessiond.
ffe60014 1593 */
f2a444f1 1594 goto end_nosignal;
ffe60014
DG
1595 }
1596 /*
1597 * The communicaton was broken hence there is a bad state between
1598 * the consumer and sessiond so stop everything.
1599 */
1600 goto error_fatal;
1601 }
1602
9ce5646a
MD
1603 health_code_update();
1604
10a50311
JD
1605 /*
1606 * In no monitor mode, the streams ownership is kept inside the channel
1607 * so don't send them to the data thread.
1608 */
1609 if (!channel->monitor) {
1610 goto end_msg_sessiond;
1611 }
1612
d88aee68
DG
1613 ret = send_streams_to_thread(channel, ctx);
1614 if (ret < 0) {
1615 /*
1616 * If we are unable to send the stream to the thread, there is
1617 * a big problem so just stop everything.
1618 */
1619 goto error_fatal;
ffe60014 1620 }
ffe60014
DG
1621 /* List MUST be empty after or else it could be reused. */
1622 assert(cds_list_empty(&channel->streams.head));
d88aee68
DG
1623 goto end_msg_sessiond;
1624 }
1625 case LTTNG_CONSUMER_DESTROY_CHANNEL:
1626 {
1627 uint64_t key = msg.u.destroy_channel.key;
d88aee68 1628
a0cbdd2e
MD
1629 /*
1630 * Only called if streams have not been sent to stream
1631 * manager thread. However, channel has been sent to
1632 * channel manager thread.
1633 */
1634 notify_thread_del_channel(ctx, key);
d88aee68 1635 goto end_msg_sessiond;
ffe60014 1636 }
d88aee68
DG
1637 case LTTNG_CONSUMER_CLOSE_METADATA:
1638 {
1639 int ret;
1640
1641 ret = close_metadata(msg.u.close_metadata.key);
1642 if (ret != 0) {
1643 ret_code = ret;
1644 }
1645
1646 goto end_msg_sessiond;
1647 }
7972aab2
DG
1648 case LTTNG_CONSUMER_FLUSH_CHANNEL:
1649 {
1650 int ret;
1651
1652 ret = flush_channel(msg.u.flush_channel.key);
1653 if (ret != 0) {
1654 ret_code = ret;
1655 }
1656
1657 goto end_msg_sessiond;
1658 }
0dd01979
MD
1659 case LTTNG_CONSUMER_CLEAR_QUIESCENT_CHANNEL:
1660 {
1661 int ret;
1662
1663 ret = clear_quiescent_channel(
1664 msg.u.clear_quiescent_channel.key);
1665 if (ret != 0) {
1666 ret_code = ret;
1667 }
1668
1669 goto end_msg_sessiond;
1670 }
d88aee68 1671 case LTTNG_CONSUMER_PUSH_METADATA:
ffe60014
DG
1672 {
1673 int ret;
d88aee68 1674 uint64_t len = msg.u.push_metadata.len;
d88aee68 1675 uint64_t key = msg.u.push_metadata.key;
331744e3 1676 uint64_t offset = msg.u.push_metadata.target_offset;
93ec662e 1677 uint64_t version = msg.u.push_metadata.version;
ffe60014
DG
1678 struct lttng_consumer_channel *channel;
1679
8fd623e0
DG
1680 DBG("UST consumer push metadata key %" PRIu64 " of len %" PRIu64, key,
1681 len);
ffe60014
DG
1682
1683 channel = consumer_find_channel(key);
1684 if (!channel) {
000baf6a
DG
1685 /*
1686 * This is possible if the metadata creation on the consumer side
1687 * is in flight vis-a-vis a concurrent push metadata from the
1688 * session daemon. Simply return that the channel failed and the
1689 * session daemon will handle that message correctly considering
1690 * that this race is acceptable thus the DBG() statement here.
1691 */
1692 DBG("UST consumer push metadata %" PRIu64 " not found", key);
1693 ret_code = LTTCOMM_CONSUMERD_CHANNEL_FAIL;
4a2eb0ca 1694 goto end_msg_sessiond;
d88aee68
DG
1695 }
1696
9ce5646a
MD
1697 health_code_update();
1698
c585821b
MD
1699 if (!len) {
1700 /*
1701 * There is nothing to receive. We have simply
1702 * checked whether the channel can be found.
1703 */
1704 ret_code = LTTCOMM_CONSUMERD_SUCCESS;
1705 goto end_msg_sessiond;
1706 }
1707
d88aee68 1708 /* Tell session daemon we are ready to receive the metadata. */
0c759fc9 1709 ret = consumer_send_status_msg(sock, LTTCOMM_CONSUMERD_SUCCESS);
ffe60014
DG
1710 if (ret < 0) {
1711 /* Somehow, the session daemon is not responding anymore. */
d88aee68
DG
1712 goto error_fatal;
1713 }
1714
9ce5646a
MD
1715 health_code_update();
1716
d88aee68 1717 /* Wait for more data. */
9ce5646a
MD
1718 health_poll_entry();
1719 ret = lttng_consumer_poll_socket(consumer_sockpoll);
1720 health_poll_exit();
84382d49 1721 if (ret) {
489f70e9 1722 goto error_fatal;
d88aee68
DG
1723 }
1724
9ce5646a
MD
1725 health_code_update();
1726
331744e3 1727 ret = lttng_ustconsumer_recv_metadata(sock, key, offset,
93ec662e 1728 len, version, channel, 0, 1);
d88aee68 1729 if (ret < 0) {
331744e3 1730 /* error receiving from sessiond */
489f70e9 1731 goto error_fatal;
331744e3
JD
1732 } else {
1733 ret_code = ret;
d88aee68
DG
1734 goto end_msg_sessiond;
1735 }
d88aee68
DG
1736 }
1737 case LTTNG_CONSUMER_SETUP_METADATA:
1738 {
1739 int ret;
1740
1741 ret = setup_metadata(ctx, msg.u.setup_metadata.key);
1742 if (ret) {
1743 ret_code = ret;
1744 }
1745 goto end_msg_sessiond;
ffe60014 1746 }
6dc3064a
DG
1747 case LTTNG_CONSUMER_SNAPSHOT_CHANNEL:
1748 {
10a50311
JD
1749 if (msg.u.snapshot_channel.metadata) {
1750 ret = snapshot_metadata(msg.u.snapshot_channel.key,
1751 msg.u.snapshot_channel.pathname,
1752 msg.u.snapshot_channel.relayd_id,
1753 ctx);
1754 if (ret < 0) {
1755 ERR("Snapshot metadata failed");
e462382a 1756 ret_code = LTTCOMM_CONSUMERD_ERROR_METADATA;
10a50311
JD
1757 }
1758 } else {
1759 ret = snapshot_channel(msg.u.snapshot_channel.key,
1760 msg.u.snapshot_channel.pathname,
1761 msg.u.snapshot_channel.relayd_id,
d07ceecd 1762 msg.u.snapshot_channel.nb_packets_per_stream,
10a50311
JD
1763 ctx);
1764 if (ret < 0) {
1765 ERR("Snapshot channel failed");
e462382a 1766 ret_code = LTTCOMM_CONSUMERD_CHANNEL_FAIL;
10a50311
JD
1767 }
1768 }
1769
9ce5646a 1770 health_code_update();
6dc3064a
DG
1771 ret = consumer_send_status_msg(sock, ret_code);
1772 if (ret < 0) {
1773 /* Somehow, the session daemon is not responding anymore. */
1774 goto end_nosignal;
1775 }
9ce5646a 1776 health_code_update();
6dc3064a
DG
1777 break;
1778 }
fb83fe64
JD
1779 case LTTNG_CONSUMER_DISCARDED_EVENTS:
1780 {
beb59458
MJ
1781 int ret = 0;
1782 uint64_t discarded_events;
fb83fe64
JD
1783 struct lttng_ht_iter iter;
1784 struct lttng_ht *ht;
1785 struct lttng_consumer_stream *stream;
1786 uint64_t id = msg.u.discarded_events.session_id;
1787 uint64_t key = msg.u.discarded_events.channel_key;
1788
1789 DBG("UST consumer discarded events command for session id %"
1790 PRIu64, id);
1791 rcu_read_lock();
1792 pthread_mutex_lock(&consumer_data.lock);
1793
1794 ht = consumer_data.stream_list_ht;
1795
1796 /*
1797 * We only need a reference to the channel, but they are not
1798 * directly indexed, so we just use the first matching stream
1799 * to extract the information we need, we default to 0 if not
1800 * found (no events are dropped if the channel is not yet in
1801 * use).
1802 */
beb59458 1803 discarded_events = 0;
fb83fe64
JD
1804 cds_lfht_for_each_entry_duplicate(ht->ht,
1805 ht->hash_fct(&id, lttng_ht_seed),
1806 ht->match_fct, &id,
1807 &iter.iter, stream, node_session_id.node) {
1808 if (stream->chan->key == key) {
beb59458 1809 discarded_events = stream->chan->discarded_events;
fb83fe64
JD
1810 break;
1811 }
1812 }
1813 pthread_mutex_unlock(&consumer_data.lock);
1814 rcu_read_unlock();
1815
1816 DBG("UST consumer discarded events command for session id %"
1817 PRIu64 ", channel key %" PRIu64, id, key);
1818
1819 health_code_update();
1820
1821 /* Send back returned value to session daemon */
beb59458 1822 ret = lttcomm_send_unix_sock(sock, &discarded_events, sizeof(discarded_events));
fb83fe64
JD
1823 if (ret < 0) {
1824 PERROR("send discarded events");
1825 goto error_fatal;
1826 }
1827
1828 break;
1829 }
1830 case LTTNG_CONSUMER_LOST_PACKETS:
1831 {
9a06e8d4
JG
1832 int ret;
1833 uint64_t lost_packets;
fb83fe64
JD
1834 struct lttng_ht_iter iter;
1835 struct lttng_ht *ht;
1836 struct lttng_consumer_stream *stream;
1837 uint64_t id = msg.u.lost_packets.session_id;
1838 uint64_t key = msg.u.lost_packets.channel_key;
1839
1840 DBG("UST consumer lost packets command for session id %"
1841 PRIu64, id);
1842 rcu_read_lock();
1843 pthread_mutex_lock(&consumer_data.lock);
1844
1845 ht = consumer_data.stream_list_ht;
1846
1847 /*
1848 * We only need a reference to the channel, but they are not
1849 * directly indexed, so we just use the first matching stream
1850 * to extract the information we need, we default to 0 if not
1851 * found (no packets lost if the channel is not yet in use).
1852 */
9a06e8d4 1853 lost_packets = 0;
fb83fe64
JD
1854 cds_lfht_for_each_entry_duplicate(ht->ht,
1855 ht->hash_fct(&id, lttng_ht_seed),
1856 ht->match_fct, &id,
1857 &iter.iter, stream, node_session_id.node) {
1858 if (stream->chan->key == key) {
9a06e8d4 1859 lost_packets = stream->chan->lost_packets;
fb83fe64
JD
1860 break;
1861 }
1862 }
1863 pthread_mutex_unlock(&consumer_data.lock);
1864 rcu_read_unlock();
1865
1866 DBG("UST consumer lost packets command for session id %"
1867 PRIu64 ", channel key %" PRIu64, id, key);
1868
1869 health_code_update();
1870
1871 /* Send back returned value to session daemon */
9a06e8d4
JG
1872 ret = lttcomm_send_unix_sock(sock, &lost_packets,
1873 sizeof(lost_packets));
fb83fe64
JD
1874 if (ret < 0) {
1875 PERROR("send lost packets");
1876 goto error_fatal;
1877 }
1878
1879 break;
1880 }
b3530820
JG
1881 case LTTNG_CONSUMER_SET_CHANNEL_MONITOR_PIPE:
1882 {
1883 int channel_monitor_pipe;
1884
1885 ret_code = LTTCOMM_CONSUMERD_SUCCESS;
1886 /* Successfully received the command's type. */
1887 ret = consumer_send_status_msg(sock, ret_code);
1888 if (ret < 0) {
1889 goto error_fatal;
1890 }
1891
1892 ret = lttcomm_recv_fds_unix_sock(sock, &channel_monitor_pipe,
1893 1);
1894 if (ret != sizeof(channel_monitor_pipe)) {
1895 ERR("Failed to receive channel monitor pipe");
1896 goto error_fatal;
1897 }
1898
1899 DBG("Received channel monitor pipe (%d)", channel_monitor_pipe);
1900 ret = consumer_timer_thread_set_channel_monitor_pipe(
1901 channel_monitor_pipe);
1902 if (!ret) {
1903 int flags;
1904
1905 ret_code = LTTCOMM_CONSUMERD_SUCCESS;
1906 /* Set the pipe as non-blocking. */
1907 ret = fcntl(channel_monitor_pipe, F_GETFL, 0);
1908 if (ret == -1) {
1909 PERROR("fcntl get flags of the channel monitoring pipe");
1910 goto error_fatal;
1911 }
1912 flags = ret;
1913
1914 ret = fcntl(channel_monitor_pipe, F_SETFL,
1915 flags | O_NONBLOCK);
1916 if (ret == -1) {
1917 PERROR("fcntl set O_NONBLOCK flag of the channel monitoring pipe");
1918 goto error_fatal;
1919 }
1920 DBG("Channel monitor pipe set as non-blocking");
1921 } else {
1922 ret_code = LTTCOMM_CONSUMERD_ALREADY_SET;
1923 }
1924 goto end_msg_sessiond;
1925 }
e1f42159
JR
1926 case LTTNG_CONSUMER_CLEAR_CHANNEL:
1927 {
1928 struct lttng_consumer_channel *channel;
1929 uint64_t key = msg.u.clear_channel.key;
1930
1931 channel = consumer_find_channel(key);
1932 if (!channel) {
1933 DBG("Channel %" PRIu64 " not found", key);
1934 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
1935 } else {
1936 ret = lttng_consumer_clear_channel(channel);
1937 if (ret) {
4b534b8b 1938 ERR("Clear channel failed key %" PRIu64, key);
e1f42159
JR
1939 ret_code = ret;
1940 }
1941
1942 health_code_update();
1943 }
1944 ret = consumer_send_status_msg(sock, ret_code);
1945 if (ret < 0) {
1946 /* Somehow, the session daemon is not responding anymore. */
1947 goto end_nosignal;
1948 }
1949 break;
1950 }
3f505e4b
MD
1951 case LTTNG_CONSUMER_CLEAR_SESSION:
1952 {
1953 uint64_t session_id = msg.u.clear_session.session_id;
1954
1955 ret = lttng_consumer_clear_session(session_id);
1956 if (ret) {
1957 ERR("Clear session failed session_id %" PRIu64, session_id);
1958 ret_code = ret;
1959 }
1960
1961 health_code_update();
1962 ret = consumer_send_status_msg(sock, ret_code);
1963 if (ret < 0) {
1964 /* Somehow, the session daemon is not responding anymore. */
1965 goto end_nosignal;
1966 }
1967 break;
1968 }
1969
3bd1e081
MD
1970 default:
1971 break;
1972 }
3f8e211f 1973
3bd1e081 1974end_nosignal:
b0b335c8 1975 rcu_read_unlock();
4cbc1a04 1976
9ce5646a
MD
1977 health_code_update();
1978
4cbc1a04
DG
1979 /*
1980 * Return 1 to indicate success since the 0 value can be a socket
1981 * shutdown during the recv() or send() call.
1982 */
1983 return 1;
ffe60014
DG
1984
1985end_msg_sessiond:
1986 /*
1987 * The returned value here is not useful since either way we'll return 1 to
1988 * the caller because the session daemon socket management is done
1989 * elsewhere. Returning a negative code or 0 will shutdown the consumer.
1990 */
489f70e9
MD
1991 ret = consumer_send_status_msg(sock, ret_code);
1992 if (ret < 0) {
1993 goto error_fatal;
1994 }
ffe60014 1995 rcu_read_unlock();
9ce5646a
MD
1996
1997 health_code_update();
1998
ffe60014
DG
1999 return 1;
2000end_channel_error:
2001 if (channel) {
2002 /*
2003 * Free channel here since no one has a reference to it. We don't
2004 * free after that because a stream can store this pointer.
2005 */
2006 destroy_channel(channel);
2007 }
2008 /* We have to send a status channel message indicating an error. */
2009 ret = consumer_send_status_channel(sock, NULL);
2010 if (ret < 0) {
2011 /* Stop everything if session daemon can not be notified. */
2012 goto error_fatal;
2013 }
2014 rcu_read_unlock();
9ce5646a
MD
2015
2016 health_code_update();
2017
ffe60014
DG
2018 return 1;
2019error_fatal:
2020 rcu_read_unlock();
2021 /* This will issue a consumer stop. */
2022 return -1;
3bd1e081
MD
2023}
2024
ffe60014
DG
2025/*
2026 * Wrapper over the mmap() read offset from ust-ctl library. Since this can be
2027 * compiled out, we isolate it in this library.
2028 */
2029int lttng_ustctl_get_mmap_read_offset(struct lttng_consumer_stream *stream,
2030 unsigned long *off)
3bd1e081 2031{
ffe60014
DG
2032 assert(stream);
2033 assert(stream->ustream);
b5c5fc29 2034
ffe60014 2035 return ustctl_get_mmap_read_offset(stream->ustream, off);
3bd1e081
MD
2036}
2037
ffe60014
DG
2038/*
2039 * Wrapper over the mmap() read offset from ust-ctl library. Since this can be
2040 * compiled out, we isolate it in this library.
2041 */
2042void *lttng_ustctl_get_mmap_base(struct lttng_consumer_stream *stream)
d056b477 2043{
ffe60014
DG
2044 assert(stream);
2045 assert(stream->ustream);
2046
2047 return ustctl_get_mmap_base(stream->ustream);
d056b477
MD
2048}
2049
ffe60014 2050/*
e9404c27 2051 * Take a snapshot for a specific stream.
ffe60014
DG
2052 *
2053 * Returns 0 on success, < 0 on error
2054 */
2055int lttng_ustconsumer_take_snapshot(struct lttng_consumer_stream *stream)
3bd1e081 2056{
ffe60014
DG
2057 assert(stream);
2058 assert(stream->ustream);
2059
2060 return ustctl_snapshot(stream->ustream);
3bd1e081
MD
2061}
2062
e9404c27
JG
2063/*
2064 * Sample consumed and produced positions for a specific stream.
2065 *
2066 * Returns 0 on success, < 0 on error.
2067 */
2068int lttng_ustconsumer_sample_snapshot_positions(
2069 struct lttng_consumer_stream *stream)
2070{
2071 assert(stream);
2072 assert(stream->ustream);
2073
2074 return ustctl_snapshot_sample_positions(stream->ustream);
2075}
2076
ffe60014
DG
2077/*
2078 * Get the produced position
2079 *
2080 * Returns 0 on success, < 0 on error
2081 */
2082int lttng_ustconsumer_get_produced_snapshot(
2083 struct lttng_consumer_stream *stream, unsigned long *pos)
3bd1e081 2084{
ffe60014
DG
2085 assert(stream);
2086 assert(stream->ustream);
2087 assert(pos);
7a57cf92 2088
ffe60014
DG
2089 return ustctl_snapshot_get_produced(stream->ustream, pos);
2090}
7a57cf92 2091
10a50311
JD
2092/*
2093 * Get the consumed position
2094 *
2095 * Returns 0 on success, < 0 on error
2096 */
2097int lttng_ustconsumer_get_consumed_snapshot(
2098 struct lttng_consumer_stream *stream, unsigned long *pos)
2099{
2100 assert(stream);
2101 assert(stream->ustream);
2102 assert(pos);
2103
2104 return ustctl_snapshot_get_consumed(stream->ustream, pos);
2105}
2106
84a182ce
DG
2107void lttng_ustconsumer_flush_buffer(struct lttng_consumer_stream *stream,
2108 int producer)
2109{
2110 assert(stream);
2111 assert(stream->ustream);
2112
2113 ustctl_flush_buffer(stream->ustream, producer);
2114}
2115
087b053b
JR
2116void lttng_ustconsumer_clear_buffer(struct lttng_consumer_stream *stream)
2117{
2118 assert(stream);
2119 assert(stream->ustream);
2120
2121 ustctl_clear_buffer(stream->ustream);
2122}
2123
84a182ce
DG
2124int lttng_ustconsumer_get_current_timestamp(
2125 struct lttng_consumer_stream *stream, uint64_t *ts)
2126{
2127 assert(stream);
2128 assert(stream->ustream);
2129 assert(ts);
2130
2131 return ustctl_get_current_timestamp(stream->ustream, ts);
2132}
2133
fb83fe64
JD
2134int lttng_ustconsumer_get_sequence_number(
2135 struct lttng_consumer_stream *stream, uint64_t *seq)
2136{
2137 assert(stream);
2138 assert(stream->ustream);
2139 assert(seq);
2140
2141 return ustctl_get_sequence_number(stream->ustream, seq);
2142}
2143
ffe60014 2144/*
0dd01979 2145 * Called when the stream signals the consumer that it has hung up.
ffe60014
DG
2146 */
2147void lttng_ustconsumer_on_stream_hangup(struct lttng_consumer_stream *stream)
2148{
2149 assert(stream);
2150 assert(stream->ustream);
2c1dd183 2151
0dd01979
MD
2152 pthread_mutex_lock(&stream->lock);
2153 if (!stream->quiescent) {
2154 ustctl_flush_buffer(stream->ustream, 0);
2155 stream->quiescent = true;
2156 }
2157 pthread_mutex_unlock(&stream->lock);
ffe60014
DG
2158 stream->hangup_flush_done = 1;
2159}
ee77a7b0 2160
ffe60014
DG
2161void lttng_ustconsumer_del_channel(struct lttng_consumer_channel *chan)
2162{
4628484a
MD
2163 int i;
2164
ffe60014
DG
2165 assert(chan);
2166 assert(chan->uchan);
e316aad5 2167
ea88ca2a
MD
2168 if (chan->switch_timer_enabled == 1) {
2169 consumer_timer_switch_stop(chan);
2170 }
4628484a
MD
2171 for (i = 0; i < chan->nr_stream_fds; i++) {
2172 int ret;
2173
2174 ret = close(chan->stream_fds[i]);
2175 if (ret) {
2176 PERROR("close");
2177 }
2178 if (chan->shm_path[0]) {
2179 char shm_path[PATH_MAX];
2180
2181 ret = get_stream_shm_path(shm_path, chan->shm_path, i);
2182 if (ret) {
2183 ERR("Cannot get stream shm path");
2184 }
2185 ret = run_as_unlink(shm_path, chan->uid, chan->gid);
2186 if (ret) {
4628484a
MD
2187 PERROR("unlink %s", shm_path);
2188 }
2189 }
2190 }
3bd1e081
MD
2191}
2192
b83e03c4
MD
2193void lttng_ustconsumer_free_channel(struct lttng_consumer_channel *chan)
2194{
2195 assert(chan);
2196 assert(chan->uchan);
2197
2198 consumer_metadata_cache_destroy(chan);
2199 ustctl_destroy_channel(chan->uchan);
ea853771
JR
2200 /* Try to rmdir all directories under shm_path root. */
2201 if (chan->root_shm_path[0]) {
602766ec 2202 (void) run_as_rmdir_recursive(chan->root_shm_path,
ea853771
JR
2203 chan->uid, chan->gid);
2204 }
b83e03c4
MD
2205 free(chan->stream_fds);
2206}
2207
3bd1e081
MD
2208void lttng_ustconsumer_del_stream(struct lttng_consumer_stream *stream)
2209{
ffe60014
DG
2210 assert(stream);
2211 assert(stream->ustream);
d41f73b7 2212
ea88ca2a
MD
2213 if (stream->chan->switch_timer_enabled == 1) {
2214 consumer_timer_switch_stop(stream->chan);
2215 }
ffe60014
DG
2216 ustctl_destroy_stream(stream->ustream);
2217}
d41f73b7 2218
6d574024
DG
2219int lttng_ustconsumer_get_wakeup_fd(struct lttng_consumer_stream *stream)
2220{
2221 assert(stream);
2222 assert(stream->ustream);
2223
2224 return ustctl_stream_get_wakeup_fd(stream->ustream);
2225}
2226
2227int lttng_ustconsumer_close_wakeup_fd(struct lttng_consumer_stream *stream)
2228{
2229 assert(stream);
2230 assert(stream->ustream);
2231
2232 return ustctl_stream_close_wakeup_fd(stream->ustream);
2233}
2234
309167d2
JD
2235/*
2236 * Populate index values of a UST stream. Values are set in big endian order.
2237 *
2238 * Return 0 on success or else a negative value.
2239 */
50adc264 2240static int get_index_values(struct ctf_packet_index *index,
309167d2
JD
2241 struct ustctl_consumer_stream *ustream)
2242{
2243 int ret;
2244
2245 ret = ustctl_get_timestamp_begin(ustream, &index->timestamp_begin);
2246 if (ret < 0) {
2247 PERROR("ustctl_get_timestamp_begin");
2248 goto error;
2249 }
2250 index->timestamp_begin = htobe64(index->timestamp_begin);
2251
2252 ret = ustctl_get_timestamp_end(ustream, &index->timestamp_end);
2253 if (ret < 0) {
2254 PERROR("ustctl_get_timestamp_end");
2255 goto error;
2256 }
2257 index->timestamp_end = htobe64(index->timestamp_end);
2258
2259 ret = ustctl_get_events_discarded(ustream, &index->events_discarded);
2260 if (ret < 0) {
2261 PERROR("ustctl_get_events_discarded");
2262 goto error;
2263 }
2264 index->events_discarded = htobe64(index->events_discarded);
2265
2266 ret = ustctl_get_content_size(ustream, &index->content_size);
2267 if (ret < 0) {
2268 PERROR("ustctl_get_content_size");
2269 goto error;
2270 }
2271 index->content_size = htobe64(index->content_size);
2272
2273 ret = ustctl_get_packet_size(ustream, &index->packet_size);
2274 if (ret < 0) {
2275 PERROR("ustctl_get_packet_size");
2276 goto error;
2277 }
2278 index->packet_size = htobe64(index->packet_size);
2279
2280 ret = ustctl_get_stream_id(ustream, &index->stream_id);
2281 if (ret < 0) {
2282 PERROR("ustctl_get_stream_id");
2283 goto error;
2284 }
2285 index->stream_id = htobe64(index->stream_id);
2286
234cd636
JD
2287 ret = ustctl_get_instance_id(ustream, &index->stream_instance_id);
2288 if (ret < 0) {
2289 PERROR("ustctl_get_instance_id");
2290 goto error;
2291 }
2292 index->stream_instance_id = htobe64(index->stream_instance_id);
2293
2294 ret = ustctl_get_sequence_number(ustream, &index->packet_seq_num);
2295 if (ret < 0) {
2296 PERROR("ustctl_get_sequence_number");
2297 goto error;
2298 }
2299 index->packet_seq_num = htobe64(index->packet_seq_num);
2300
309167d2
JD
2301error:
2302 return ret;
2303}
2304
93ec662e
JD
2305static
2306void metadata_stream_reset_cache(struct lttng_consumer_stream *stream,
2307 struct consumer_metadata_cache *cache)
2308{
2309 DBG("Metadata stream update to version %" PRIu64,
2310 cache->version);
2311 stream->ust_metadata_pushed = 0;
2312 stream->metadata_version = cache->version;
2313 stream->reset_metadata_flag = 1;
2314}
2315
2316/*
2317 * Check if the version of the metadata stream and metadata cache match.
2318 * If the cache got updated, reset the metadata stream.
2319 * The stream lock and metadata cache lock MUST be held.
2320 * Return 0 on success, a negative value on error.
2321 */
2322static
2323int metadata_stream_check_version(struct lttng_consumer_stream *stream)
2324{
2325 int ret = 0;
2326 struct consumer_metadata_cache *cache = stream->chan->metadata_cache;
2327
2328 if (cache->version == stream->metadata_version) {
2329 goto end;
2330 }
2331 metadata_stream_reset_cache(stream, cache);
2332
2333end:
2334 return ret;
2335}
2336
94d49140
JD
2337/*
2338 * Write up to one packet from the metadata cache to the channel.
2339 *
2340 * Returns the number of bytes pushed in the cache, or a negative value
2341 * on error.
2342 */
2343static
2344int commit_one_metadata_packet(struct lttng_consumer_stream *stream)
2345{
2346 ssize_t write_len;
2347 int ret;
2348
2349 pthread_mutex_lock(&stream->chan->metadata_cache->lock);
93ec662e
JD
2350 ret = metadata_stream_check_version(stream);
2351 if (ret < 0) {
2352 goto end;
2353 }
c585821b 2354 if (stream->chan->metadata_cache->max_offset
94d49140
JD
2355 == stream->ust_metadata_pushed) {
2356 ret = 0;
2357 goto end;
2358 }
2359
2360 write_len = ustctl_write_one_packet_to_channel(stream->chan->uchan,
2361 &stream->chan->metadata_cache->data[stream->ust_metadata_pushed],
c585821b 2362 stream->chan->metadata_cache->max_offset
94d49140
JD
2363 - stream->ust_metadata_pushed);
2364 assert(write_len != 0);
2365 if (write_len < 0) {
2366 ERR("Writing one metadata packet");
2367 ret = -1;
2368 goto end;
2369 }
2370 stream->ust_metadata_pushed += write_len;
2371
c585821b 2372 assert(stream->chan->metadata_cache->max_offset >=
94d49140
JD
2373 stream->ust_metadata_pushed);
2374 ret = write_len;
2375
2376end:
2377 pthread_mutex_unlock(&stream->chan->metadata_cache->lock);
2378 return ret;
2379}
2380
309167d2 2381
94d49140
JD
2382/*
2383 * Sync metadata meaning request them to the session daemon and snapshot to the
2384 * metadata thread can consumer them.
2385 *
c585821b
MD
2386 * Metadata stream lock is held here, but we need to release it when
2387 * interacting with sessiond, else we cause a deadlock with live
2388 * awaiting on metadata to be pushed out.
94d49140
JD
2389 *
2390 * Return 0 if new metadatda is available, EAGAIN if the metadata stream
2391 * is empty or a negative value on error.
2392 */
2393int lttng_ustconsumer_sync_metadata(struct lttng_consumer_local_data *ctx,
2394 struct lttng_consumer_stream *metadata)
2395{
2396 int ret;
2397 int retry = 0;
2398
2399 assert(ctx);
2400 assert(metadata);
2401
c585821b 2402 pthread_mutex_unlock(&metadata->lock);
94d49140
JD
2403 /*
2404 * Request metadata from the sessiond, but don't wait for the flush
2405 * because we locked the metadata thread.
2406 */
2407 ret = lttng_ustconsumer_request_metadata(ctx, metadata->chan, 0, 0);
1caeb2eb 2408 pthread_mutex_lock(&metadata->lock);
94d49140
JD
2409 if (ret < 0) {
2410 goto end;
2411 }
2412
2413 ret = commit_one_metadata_packet(metadata);
2414 if (ret <= 0) {
2415 goto end;
2416 } else if (ret > 0) {
2417 retry = 1;
2418 }
2419
2420 ustctl_flush_buffer(metadata->ustream, 1);
2421 ret = ustctl_snapshot(metadata->ustream);
2422 if (ret < 0) {
2423 if (errno != EAGAIN) {
2424 ERR("Sync metadata, taking UST snapshot");
2425 goto end;
2426 }
2427 DBG("No new metadata when syncing them.");
2428 /* No new metadata, exit. */
2429 ret = ENODATA;
2430 goto end;
2431 }
2432
2433 /*
2434 * After this flush, we still need to extract metadata.
2435 */
2436 if (retry) {
2437 ret = EAGAIN;
2438 }
2439
2440end:
2441 return ret;
2442}
2443
02b3d176
DG
2444/*
2445 * Return 0 on success else a negative value.
2446 */
2447static int notify_if_more_data(struct lttng_consumer_stream *stream,
2448 struct lttng_consumer_local_data *ctx)
2449{
2450 int ret;
2451 struct ustctl_consumer_stream *ustream;
2452
2453 assert(stream);
2454 assert(ctx);
2455
2456 ustream = stream->ustream;
2457
2458 /*
2459 * First, we are going to check if there is a new subbuffer available
2460 * before reading the stream wait_fd.
2461 */
2462 /* Get the next subbuffer */
2463 ret = ustctl_get_next_subbuf(ustream);
2464 if (ret) {
2465 /* No more data found, flag the stream. */
2466 stream->has_data = 0;
2467 ret = 0;
2468 goto end;
2469 }
2470
5420e5db 2471 ret = ustctl_put_subbuf(ustream);
02b3d176
DG
2472 assert(!ret);
2473
2474 /* This stream still has data. Flag it and wake up the data thread. */
2475 stream->has_data = 1;
2476
2477 if (stream->monitor && !stream->hangup_flush_done && !ctx->has_wakeup) {
2478 ssize_t writelen;
2479
2480 writelen = lttng_pipe_write(ctx->consumer_wakeup_pipe, "!", 1);
2481 if (writelen < 0 && errno != EAGAIN && errno != EWOULDBLOCK) {
2482 ret = writelen;
2483 goto end;
2484 }
2485
2486 /* The wake up pipe has been notified. */
2487 ctx->has_wakeup = 1;
2488 }
2489 ret = 0;
2490
2491end:
2492 return ret;
2493}
2494
fb83fe64
JD
2495static
2496int update_stream_stats(struct lttng_consumer_stream *stream)
2497{
2498 int ret;
2499 uint64_t seq, discarded;
2500
2501 ret = ustctl_get_sequence_number(stream->ustream, &seq);
2502 if (ret < 0) {
2503 PERROR("ustctl_get_sequence_number");
2504 goto end;
2505 }
2506 /*
2507 * Start the sequence when we extract the first packet in case we don't
2508 * start at 0 (for example if a consumer is not connected to the
2509 * session immediately after the beginning).
2510 */
2511 if (stream->last_sequence_number == -1ULL) {
2512 stream->last_sequence_number = seq;
2513 } else if (seq > stream->last_sequence_number) {
2514 stream->chan->lost_packets += seq -
2515 stream->last_sequence_number - 1;
2516 } else {
2517 /* seq <= last_sequence_number */
2518 ERR("Sequence number inconsistent : prev = %" PRIu64
2519 ", current = %" PRIu64,
2520 stream->last_sequence_number, seq);
2521 ret = -1;
2522 goto end;
2523 }
2524 stream->last_sequence_number = seq;
2525
2526 ret = ustctl_get_events_discarded(stream->ustream, &discarded);
2527 if (ret < 0) {
2528 PERROR("kernctl_get_events_discarded");
2529 goto end;
2530 }
2531 if (discarded < stream->last_discarded_events) {
2532 /*
83f4233d
MJ
2533 * Overflow has occurred. We assume only one wrap-around
2534 * has occurred.
fb83fe64
JD
2535 */
2536 stream->chan->discarded_events +=
2537 (1ULL << (CAA_BITS_PER_LONG - 1)) -
2538 stream->last_discarded_events + discarded;
2539 } else {
2540 stream->chan->discarded_events += discarded -
2541 stream->last_discarded_events;
2542 }
2543 stream->last_discarded_events = discarded;
2544 ret = 0;
2545
2546end:
2547 return ret;
2548}
2549
94d49140
JD
2550/*
2551 * Read subbuffer from the given stream.
2552 *
2553 * Stream lock MUST be acquired.
2554 *
2555 * Return 0 on success else a negative value.
2556 */
d41f73b7
MD
2557int lttng_ustconsumer_read_subbuffer(struct lttng_consumer_stream *stream,
2558 struct lttng_consumer_local_data *ctx)
2559{
1d4dfdef 2560 unsigned long len, subbuf_size, padding;
1c20f0e2 2561 int err, write_index = 1;
d41f73b7 2562 long ret = 0;
ffe60014 2563 struct ustctl_consumer_stream *ustream;
50adc264 2564 struct ctf_packet_index index;
ffe60014
DG
2565
2566 assert(stream);
2567 assert(stream->ustream);
2568 assert(ctx);
d41f73b7 2569
3eb914c0 2570 DBG("In UST read_subbuffer (wait_fd: %d, name: %s)", stream->wait_fd,
ffe60014
DG
2571 stream->name);
2572
2573 /* Ease our life for what's next. */
2574 ustream = stream->ustream;
d41f73b7 2575
6cd525e8 2576 /*
02b3d176
DG
2577 * We can consume the 1 byte written into the wait_fd by UST. Don't trigger
2578 * error if we cannot read this one byte (read returns 0), or if the error
2579 * is EAGAIN or EWOULDBLOCK.
2580 *
2581 * This is only done when the stream is monitored by a thread, before the
2582 * flush is done after a hangup and if the stream is not flagged with data
2583 * since there might be nothing to consume in the wait fd but still have
2584 * data available flagged by the consumer wake up pipe.
6cd525e8 2585 */
02b3d176
DG
2586 if (stream->monitor && !stream->hangup_flush_done && !stream->has_data) {
2587 char dummy;
c617c0c6
MD
2588 ssize_t readlen;
2589
6cd525e8
MD
2590 readlen = lttng_read(stream->wait_fd, &dummy, 1);
2591 if (readlen < 0 && errno != EAGAIN && errno != EWOULDBLOCK) {
effcf122
MD
2592 ret = readlen;
2593 goto end;
2594 }
d41f73b7
MD
2595 }
2596
04ef1097 2597retry:
d41f73b7 2598 /* Get the next subbuffer */
ffe60014 2599 err = ustctl_get_next_subbuf(ustream);
d41f73b7 2600 if (err != 0) {
04ef1097
MD
2601 /*
2602 * Populate metadata info if the existing info has
2603 * already been read.
2604 */
2605 if (stream->metadata_flag) {
94d49140
JD
2606 ret = commit_one_metadata_packet(stream);
2607 if (ret <= 0) {
04ef1097
MD
2608 goto end;
2609 }
04ef1097
MD
2610 ustctl_flush_buffer(stream->ustream, 1);
2611 goto retry;
2612 }
2613
1d4dfdef 2614 ret = err; /* ustctl_get_next_subbuf returns negative, caller expect positive. */
d41f73b7
MD
2615 /*
2616 * This is a debug message even for single-threaded consumer,
2617 * because poll() have more relaxed criterions than get subbuf,
2618 * so get_subbuf may fail for short race windows where poll()
2619 * would issue wakeups.
2620 */
2621 DBG("Reserving sub buffer failed (everything is normal, "
ffe60014 2622 "it is due to concurrency) [ret: %d]", err);
d41f73b7
MD
2623 goto end;
2624 }
ffe60014 2625 assert(stream->chan->output == CONSUMER_CHANNEL_MMAP);
309167d2 2626
1c20f0e2 2627 if (!stream->metadata_flag) {
309167d2
JD
2628 index.offset = htobe64(stream->out_fd_offset);
2629 ret = get_index_values(&index, ustream);
2630 if (ret < 0) {
7b87473d
MD
2631 err = ustctl_put_subbuf(ustream);
2632 assert(err == 0);
309167d2
JD
2633 goto end;
2634 }
fb83fe64
JD
2635
2636 /* Update the stream's sequence and discarded events count. */
2637 ret = update_stream_stats(stream);
2638 if (ret < 0) {
2639 PERROR("kernctl_get_events_discarded");
7b87473d
MD
2640 err = ustctl_put_subbuf(ustream);
2641 assert(err == 0);
fb83fe64
JD
2642 goto end;
2643 }
1c20f0e2
JD
2644 } else {
2645 write_index = 0;
309167d2
JD
2646 }
2647
1d4dfdef 2648 /* Get the full padded subbuffer size */
ffe60014 2649 err = ustctl_get_padded_subbuf_size(ustream, &len);
effcf122 2650 assert(err == 0);
1d4dfdef
DG
2651
2652 /* Get subbuffer data size (without padding) */
ffe60014 2653 err = ustctl_get_subbuf_size(ustream, &subbuf_size);
1d4dfdef
DG
2654 assert(err == 0);
2655
2656 /* Make sure we don't get a subbuffer size bigger than the padded */
2657 assert(len >= subbuf_size);
2658
2659 padding = len - subbuf_size;
d41f73b7 2660 /* write the subbuffer to the tracefile */
309167d2 2661 ret = lttng_consumer_on_read_subbuffer_mmap(ctx, stream, subbuf_size, padding, &index);
91dfef6e
DG
2662 /*
2663 * The mmap operation should write subbuf_size amount of data when network
2664 * streaming or the full padding (len) size when we are _not_ streaming.
2665 */
d88aee68
DG
2666 if ((ret != subbuf_size && stream->net_seq_idx != (uint64_t) -1ULL) ||
2667 (ret != len && stream->net_seq_idx == (uint64_t) -1ULL)) {
d41f73b7 2668 /*
91dfef6e 2669 * Display the error but continue processing to try to release the
c5c45efa
DG
2670 * subbuffer. This is a DBG statement since any unexpected kill or
2671 * signal, the application gets unregistered, relayd gets closed or
2672 * anything that affects the buffer lifetime will trigger this error.
2673 * So, for the sake of the user, don't print this error since it can
2674 * happen and it is OK with the code flow.
d41f73b7 2675 */
c5c45efa 2676 DBG("Error writing to tracefile "
8fd623e0 2677 "(ret: %ld != len: %lu != subbuf_size: %lu)",
91dfef6e 2678 ret, len, subbuf_size);
309167d2 2679 write_index = 0;
d41f73b7 2680 }
ffe60014 2681 err = ustctl_put_next_subbuf(ustream);
effcf122 2682 assert(err == 0);
331744e3 2683
02b3d176
DG
2684 /*
2685 * This will consumer the byte on the wait_fd if and only if there is not
2686 * next subbuffer to be acquired.
2687 */
2688 if (!stream->metadata_flag) {
2689 ret = notify_if_more_data(stream, ctx);
2690 if (ret < 0) {
2691 goto end;
2692 }
2693 }
2694
309167d2 2695 /* Write index if needed. */
1c20f0e2
JD
2696 if (!write_index) {
2697 goto end;
2698 }
2699
94d49140
JD
2700 if (stream->chan->live_timer_interval && !stream->metadata_flag) {
2701 /*
2702 * In live, block until all the metadata is sent.
2703 */
c585821b
MD
2704 pthread_mutex_lock(&stream->metadata_timer_lock);
2705 assert(!stream->missed_metadata_flush);
2706 stream->waiting_on_metadata = true;
2707 pthread_mutex_unlock(&stream->metadata_timer_lock);
2708
94d49140 2709 err = consumer_stream_sync_metadata(ctx, stream->session_id);
c585821b
MD
2710
2711 pthread_mutex_lock(&stream->metadata_timer_lock);
2712 stream->waiting_on_metadata = false;
2713 if (stream->missed_metadata_flush) {
2714 stream->missed_metadata_flush = false;
2715 pthread_mutex_unlock(&stream->metadata_timer_lock);
2716 (void) consumer_flush_ust_index(stream);
2717 } else {
2718 pthread_mutex_unlock(&stream->metadata_timer_lock);
2719 }
2720
94d49140
JD
2721 if (err < 0) {
2722 goto end;
2723 }
2724 }
2725
1c20f0e2
JD
2726 assert(!stream->metadata_flag);
2727 err = consumer_stream_write_index(stream, &index);
2728 if (err < 0) {
2729 goto end;
309167d2
JD
2730 }
2731
d41f73b7
MD
2732end:
2733 return ret;
2734}
2735
ffe60014
DG
2736/*
2737 * Called when a stream is created.
fe4477ee
JD
2738 *
2739 * Return 0 on success or else a negative value.
ffe60014 2740 */
d41f73b7
MD
2741int lttng_ustconsumer_on_recv_stream(struct lttng_consumer_stream *stream)
2742{
fe4477ee
JD
2743 int ret;
2744
10a50311
JD
2745 assert(stream);
2746
fe4477ee 2747 /* Don't create anything if this is set for streaming. */
10a50311 2748 if (stream->net_seq_idx == (uint64_t) -1ULL && stream->chan->monitor) {
fe4477ee
JD
2749 ret = utils_create_stream_file(stream->chan->pathname, stream->name,
2750 stream->chan->tracefile_size, stream->tracefile_count_current,
309167d2 2751 stream->uid, stream->gid, NULL);
fe4477ee
JD
2752 if (ret < 0) {
2753 goto error;
2754 }
2755 stream->out_fd = ret;
2756 stream->tracefile_size_current = 0;
309167d2
JD
2757
2758 if (!stream->metadata_flag) {
f8f3885c
MD
2759 struct lttng_index_file *index_file;
2760
2761 index_file = lttng_index_file_create(stream->chan->pathname,
309167d2
JD
2762 stream->name, stream->uid, stream->gid,
2763 stream->chan->tracefile_size,
f8f3885c
MD
2764 stream->tracefile_count_current,
2765 CTF_INDEX_MAJOR, CTF_INDEX_MINOR);
2766 if (!index_file) {
309167d2
JD
2767 goto error;
2768 }
1b47ae58 2769 assert(!stream->index_file);
f8f3885c 2770 stream->index_file = index_file;
309167d2 2771 }
fe4477ee
JD
2772 }
2773 ret = 0;
2774
2775error:
2776 return ret;
d41f73b7 2777}
ca22feea
DG
2778
2779/*
2780 * Check if data is still being extracted from the buffers for a specific
4e9a4686
DG
2781 * stream. Consumer data lock MUST be acquired before calling this function
2782 * and the stream lock.
ca22feea 2783 *
6d805429 2784 * Return 1 if the traced data are still getting read else 0 meaning that the
ca22feea
DG
2785 * data is available for trace viewer reading.
2786 */
6d805429 2787int lttng_ustconsumer_data_pending(struct lttng_consumer_stream *stream)
ca22feea
DG
2788{
2789 int ret;
2790
2791 assert(stream);
ffe60014 2792 assert(stream->ustream);
ca22feea 2793
6d805429 2794 DBG("UST consumer checking data pending");
c8f59ee5 2795
ca6b395f
MD
2796 if (stream->endpoint_status != CONSUMER_ENDPOINT_ACTIVE) {
2797 ret = 0;
2798 goto end;
2799 }
2800
04ef1097 2801 if (stream->chan->type == CONSUMER_CHANNEL_TYPE_METADATA) {
e6ee4eab
DG
2802 uint64_t contiguous, pushed;
2803
2804 /* Ease our life a bit. */
c585821b 2805 contiguous = stream->chan->metadata_cache->max_offset;
e6ee4eab
DG
2806 pushed = stream->ust_metadata_pushed;
2807
04ef1097
MD
2808 /*
2809 * We can simply check whether all contiguously available data
2810 * has been pushed to the ring buffer, since the push operation
2811 * is performed within get_next_subbuf(), and because both
2812 * get_next_subbuf() and put_next_subbuf() are issued atomically
2813 * thanks to the stream lock within
2814 * lttng_ustconsumer_read_subbuffer(). This basically means that
2815 * whetnever ust_metadata_pushed is incremented, the associated
2816 * metadata has been consumed from the metadata stream.
2817 */
2818 DBG("UST consumer metadata pending check: contiguous %" PRIu64 " vs pushed %" PRIu64,
e6ee4eab 2819 contiguous, pushed);
aa01b94c 2820 assert(((int64_t) (contiguous - pushed)) >= 0);
e6ee4eab 2821 if ((contiguous != pushed) ||
6acdf328 2822 (((int64_t) contiguous - pushed) > 0 || contiguous == 0)) {
04ef1097
MD
2823 ret = 1; /* Data is pending */
2824 goto end;
2825 }
2826 } else {
2827 ret = ustctl_get_next_subbuf(stream->ustream);
2828 if (ret == 0) {
2829 /*
2830 * There is still data so let's put back this
2831 * subbuffer.
2832 */
2833 ret = ustctl_put_subbuf(stream->ustream);
2834 assert(ret == 0);
2835 ret = 1; /* Data is pending */
2836 goto end;
2837 }
ca22feea
DG
2838 }
2839
6d805429
DG
2840 /* Data is NOT pending so ready to be read. */
2841 ret = 0;
ca22feea 2842
6efae65e
DG
2843end:
2844 return ret;
ca22feea 2845}
d88aee68 2846
6d574024
DG
2847/*
2848 * Stop a given metadata channel timer if enabled and close the wait fd which
2849 * is the poll pipe of the metadata stream.
2850 *
2851 * This MUST be called with the metadata channel acquired.
2852 */
2853void lttng_ustconsumer_close_metadata(struct lttng_consumer_channel *metadata)
2854{
2855 int ret;
2856
2857 assert(metadata);
2858 assert(metadata->type == CONSUMER_CHANNEL_TYPE_METADATA);
2859
2860 DBG("Closing metadata channel key %" PRIu64, metadata->key);
2861
2862 if (metadata->switch_timer_enabled == 1) {
2863 consumer_timer_switch_stop(metadata);
2864 }
2865
2866 if (!metadata->metadata_stream) {
2867 goto end;
2868 }
2869
2870 /*
2871 * Closing write side so the thread monitoring the stream wakes up if any
2872 * and clean the metadata stream.
2873 */
2874 if (metadata->metadata_stream->ust_metadata_poll_pipe[1] >= 0) {
2875 ret = close(metadata->metadata_stream->ust_metadata_poll_pipe[1]);
2876 if (ret < 0) {
2877 PERROR("closing metadata pipe write side");
2878 }
2879 metadata->metadata_stream->ust_metadata_poll_pipe[1] = -1;
2880 }
2881
2882end:
2883 return;
2884}
2885
d88aee68
DG
2886/*
2887 * Close every metadata stream wait fd of the metadata hash table. This
2888 * function MUST be used very carefully so not to run into a race between the
2889 * metadata thread handling streams and this function closing their wait fd.
2890 *
2891 * For UST, this is used when the session daemon hangs up. Its the metadata
2892 * producer so calling this is safe because we are assured that no state change
2893 * can occur in the metadata thread for the streams in the hash table.
2894 */
6d574024 2895void lttng_ustconsumer_close_all_metadata(struct lttng_ht *metadata_ht)
d88aee68 2896{
d88aee68
DG
2897 struct lttng_ht_iter iter;
2898 struct lttng_consumer_stream *stream;
2899
2900 assert(metadata_ht);
2901 assert(metadata_ht->ht);
2902
2903 DBG("UST consumer closing all metadata streams");
2904
2905 rcu_read_lock();
2906 cds_lfht_for_each_entry(metadata_ht->ht, &iter.iter, stream,
2907 node.node) {
9ce5646a
MD
2908
2909 health_code_update();
2910
be2b50c7 2911 pthread_mutex_lock(&stream->chan->lock);
6d574024 2912 lttng_ustconsumer_close_metadata(stream->chan);
be2b50c7
DG
2913 pthread_mutex_unlock(&stream->chan->lock);
2914
d88aee68
DG
2915 }
2916 rcu_read_unlock();
2917}
d8ef542d
MD
2918
2919void lttng_ustconsumer_close_stream_wakeup(struct lttng_consumer_stream *stream)
2920{
2921 int ret;
2922
2923 ret = ustctl_stream_close_wakeup_fd(stream->ustream);
2924 if (ret < 0) {
2925 ERR("Unable to close wakeup fd");
2926 }
2927}
331744e3 2928
f666ae70
MD
2929/*
2930 * Please refer to consumer-timer.c before adding any lock within this
2931 * function or any of its callees. Timers have a very strict locking
2932 * semantic with respect to teardown. Failure to respect this semantic
2933 * introduces deadlocks.
c585821b
MD
2934 *
2935 * DON'T hold the metadata lock when calling this function, else this
2936 * can cause deadlock involving consumer awaiting for metadata to be
2937 * pushed out due to concurrent interaction with the session daemon.
f666ae70 2938 */
331744e3 2939int lttng_ustconsumer_request_metadata(struct lttng_consumer_local_data *ctx,
94d49140 2940 struct lttng_consumer_channel *channel, int timer, int wait)
331744e3
JD
2941{
2942 struct lttcomm_metadata_request_msg request;
2943 struct lttcomm_consumer_msg msg;
0c759fc9 2944 enum lttcomm_return_code ret_code = LTTCOMM_CONSUMERD_SUCCESS;
93ec662e 2945 uint64_t len, key, offset, version;
331744e3
JD
2946 int ret;
2947
2948 assert(channel);
2949 assert(channel->metadata_cache);
2950
53efb85a
MD
2951 memset(&request, 0, sizeof(request));
2952
331744e3
JD
2953 /* send the metadata request to sessiond */
2954 switch (consumer_data.type) {
2955 case LTTNG_CONSUMER64_UST:
2956 request.bits_per_long = 64;
2957 break;
2958 case LTTNG_CONSUMER32_UST:
2959 request.bits_per_long = 32;
2960 break;
2961 default:
2962 request.bits_per_long = 0;
2963 break;
2964 }
2965
2966 request.session_id = channel->session_id;
1950109e 2967 request.session_id_per_pid = channel->session_id_per_pid;
567eb353
DG
2968 /*
2969 * Request the application UID here so the metadata of that application can
2970 * be sent back. The channel UID corresponds to the user UID of the session
2971 * used for the rights on the stream file(s).
2972 */
2973 request.uid = channel->ust_app_uid;
331744e3 2974 request.key = channel->key;
567eb353 2975
1950109e 2976 DBG("Sending metadata request to sessiond, session id %" PRIu64
ac5b9467 2977 ", per-pid %" PRIu64 ", app UID %u and channel key %" PRIu64,
567eb353
DG
2978 request.session_id, request.session_id_per_pid, request.uid,
2979 request.key);
331744e3 2980
75d83e50 2981 pthread_mutex_lock(&ctx->metadata_socket_lock);
9ce5646a
MD
2982
2983 health_code_update();
2984
331744e3
JD
2985 ret = lttcomm_send_unix_sock(ctx->consumer_metadata_socket, &request,
2986 sizeof(request));
2987 if (ret < 0) {
2988 ERR("Asking metadata to sessiond");
2989 goto end;
2990 }
2991
9ce5646a
MD
2992 health_code_update();
2993
331744e3
JD
2994 /* Receive the metadata from sessiond */
2995 ret = lttcomm_recv_unix_sock(ctx->consumer_metadata_socket, &msg,
2996 sizeof(msg));
2997 if (ret != sizeof(msg)) {
8fd623e0 2998 DBG("Consumer received unexpected message size %d (expects %zu)",
331744e3
JD
2999 ret, sizeof(msg));
3000 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_ERROR_RECV_CMD);
3001 /*
3002 * The ret value might 0 meaning an orderly shutdown but this is ok
3003 * since the caller handles this.
3004 */
3005 goto end;
3006 }
3007
9ce5646a
MD
3008 health_code_update();
3009
331744e3
JD
3010 if (msg.cmd_type == LTTNG_ERR_UND) {
3011 /* No registry found */
3012 (void) consumer_send_status_msg(ctx->consumer_metadata_socket,
3013 ret_code);
3014 ret = 0;
3015 goto end;
3016 } else if (msg.cmd_type != LTTNG_CONSUMER_PUSH_METADATA) {
3017 ERR("Unexpected cmd_type received %d", msg.cmd_type);
3018 ret = -1;
3019 goto end;
3020 }
3021
3022 len = msg.u.push_metadata.len;
3023 key = msg.u.push_metadata.key;
3024 offset = msg.u.push_metadata.target_offset;
93ec662e 3025 version = msg.u.push_metadata.version;
331744e3
JD
3026
3027 assert(key == channel->key);
3028 if (len == 0) {
3029 DBG("No new metadata to receive for key %" PRIu64, key);
3030 }
3031
9ce5646a
MD
3032 health_code_update();
3033
331744e3
JD
3034 /* Tell session daemon we are ready to receive the metadata. */
3035 ret = consumer_send_status_msg(ctx->consumer_metadata_socket,
0c759fc9 3036 LTTCOMM_CONSUMERD_SUCCESS);
331744e3
JD
3037 if (ret < 0 || len == 0) {
3038 /*
3039 * Somehow, the session daemon is not responding anymore or there is
3040 * nothing to receive.
3041 */
3042 goto end;
3043 }
3044
9ce5646a
MD
3045 health_code_update();
3046
1eb682be 3047 ret = lttng_ustconsumer_recv_metadata(ctx->consumer_metadata_socket,
93ec662e 3048 key, offset, len, version, channel, timer, wait);
1eb682be 3049 if (ret >= 0) {
f2a444f1
DG
3050 /*
3051 * Only send the status msg if the sessiond is alive meaning a positive
3052 * ret code.
3053 */
1eb682be 3054 (void) consumer_send_status_msg(ctx->consumer_metadata_socket, ret);
f2a444f1 3055 }
331744e3
JD
3056 ret = 0;
3057
3058end:
9ce5646a
MD
3059 health_code_update();
3060
75d83e50 3061 pthread_mutex_unlock(&ctx->metadata_socket_lock);
331744e3
JD
3062 return ret;
3063}
70190e1c
DG
3064
3065/*
3066 * Return the ustctl call for the get stream id.
3067 */
3068int lttng_ustconsumer_get_stream_id(struct lttng_consumer_stream *stream,
3069 uint64_t *stream_id)
3070{
3071 assert(stream);
3072 assert(stream_id);
3073
3074 return ustctl_get_stream_id(stream->ustream, stream_id);
3075}
This page took 0.229978 seconds and 5 git commands to generate.