Use free running metadata channel key between sessiond and kernel consumer
[lttng-tools.git] / src / common / kernel-consumer / kernel-consumer.c
CommitLineData
3bd1e081
MD
1/*
2 * Copyright (C) 2011 - Julien Desfossez <julien.desfossez@polymtl.ca>
3 * Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
b3530820 4 * Copyright (C) 2017 - Jérémie Galarneau <jeremie.galarneau@efficios.com>
3bd1e081 5 *
d14d33bf
AM
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License, version 2 only,
8 * as published by the Free Software Foundation.
3bd1e081
MD
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
d14d33bf
AM
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
3bd1e081
MD
18 */
19
6c1c0768 20#define _LGPL_SOURCE
3bd1e081 21#include <assert.h>
3bd1e081
MD
22#include <poll.h>
23#include <pthread.h>
24#include <stdlib.h>
25#include <string.h>
26#include <sys/mman.h>
27#include <sys/socket.h>
28#include <sys/types.h>
77c7c900 29#include <inttypes.h>
3bd1e081 30#include <unistd.h>
dbb5dfe6 31#include <sys/stat.h>
3bd1e081 32
51a9e1c7 33#include <bin/lttng-consumerd/health-consumerd.h>
990570ed 34#include <common/common.h>
10a8a223 35#include <common/kernel-ctl/kernel-ctl.h>
10a8a223 36#include <common/sessiond-comm/sessiond-comm.h>
00e2e675 37#include <common/sessiond-comm/relayd.h>
dbb5dfe6 38#include <common/compat/fcntl.h>
f263b7fd 39#include <common/compat/endian.h>
acdb9057 40#include <common/pipe.h>
00e2e675 41#include <common/relayd/relayd.h>
fe4477ee 42#include <common/utils.h>
c8fea79c 43#include <common/consumer/consumer-stream.h>
309167d2 44#include <common/index/index.h>
c8fea79c 45#include <common/consumer/consumer-timer.h>
0857097f 46
10a8a223 47#include "kernel-consumer.h"
3bd1e081
MD
48
49extern struct lttng_consumer_global_data consumer_data;
50extern int consumer_poll_timeout;
3bd1e081 51
3bd1e081
MD
52/*
53 * Take a snapshot for a specific fd
54 *
55 * Returns 0 on success, < 0 on error
56 */
ffe60014 57int lttng_kconsumer_take_snapshot(struct lttng_consumer_stream *stream)
3bd1e081
MD
58{
59 int ret = 0;
60 int infd = stream->wait_fd;
61
62 ret = kernctl_snapshot(infd);
63 if (ret != 0) {
5a510c9f 64 PERROR("Getting sub-buffer snapshot.");
3bd1e081
MD
65 }
66
67 return ret;
68}
69
e9404c27
JG
70/*
71 * Sample consumed and produced positions for a specific fd.
72 *
73 * Returns 0 on success, < 0 on error.
74 */
75int lttng_kconsumer_sample_snapshot_positions(
76 struct lttng_consumer_stream *stream)
77{
78 assert(stream);
79
80 return kernctl_snapshot_sample_positions(stream->wait_fd);
81}
82
3bd1e081
MD
83/*
84 * Get the produced position
85 *
86 * Returns 0 on success, < 0 on error
87 */
ffe60014 88int lttng_kconsumer_get_produced_snapshot(struct lttng_consumer_stream *stream,
3bd1e081
MD
89 unsigned long *pos)
90{
91 int ret;
92 int infd = stream->wait_fd;
93
94 ret = kernctl_snapshot_get_produced(infd, pos);
95 if (ret != 0) {
5a510c9f 96 PERROR("kernctl_snapshot_get_produced");
3bd1e081
MD
97 }
98
99 return ret;
100}
101
07b86b52
JD
102/*
103 * Get the consumerd position
104 *
105 * Returns 0 on success, < 0 on error
106 */
107int lttng_kconsumer_get_consumed_snapshot(struct lttng_consumer_stream *stream,
108 unsigned long *pos)
109{
110 int ret;
111 int infd = stream->wait_fd;
112
113 ret = kernctl_snapshot_get_consumed(infd, pos);
114 if (ret != 0) {
5a510c9f 115 PERROR("kernctl_snapshot_get_consumed");
07b86b52
JD
116 }
117
118 return ret;
119}
120
07b86b52
JD
121/*
122 * Take a snapshot of all the stream of a channel
123 *
124 * Returns 0 on success, < 0 on error
125 */
126int lttng_kconsumer_snapshot_channel(uint64_t key, char *path,
d07ceecd 127 uint64_t relayd_id, uint64_t nb_packets_per_stream,
5c786ded 128 struct lttng_consumer_local_data *ctx)
07b86b52
JD
129{
130 int ret;
07b86b52
JD
131 struct lttng_consumer_channel *channel;
132 struct lttng_consumer_stream *stream;
133
6a00837f 134 DBG("Kernel consumer snapshot channel %" PRIu64, key);
07b86b52
JD
135
136 rcu_read_lock();
137
138 channel = consumer_find_channel(key);
139 if (!channel) {
6a00837f 140 ERR("No channel found for key %" PRIu64, key);
07b86b52
JD
141 ret = -1;
142 goto end;
143 }
144
145 /* Splice is not supported yet for channel snapshot. */
146 if (channel->output != CONSUMER_CHANNEL_MMAP) {
147 ERR("Unsupported output %d", channel->output);
148 ret = -1;
149 goto end;
150 }
151
10a50311 152 cds_list_for_each_entry(stream, &channel->streams.head, send_node) {
923333cd 153 unsigned long consumed_pos, produced_pos;
9ce5646a
MD
154
155 health_code_update();
156
07b86b52
JD
157 /*
158 * Lock stream because we are about to change its state.
159 */
160 pthread_mutex_lock(&stream->lock);
161
29decac3
DG
162 /*
163 * Assign the received relayd ID so we can use it for streaming. The streams
164 * are not visible to anyone so this is OK to change it.
165 */
07b86b52
JD
166 stream->net_seq_idx = relayd_id;
167 channel->relayd_id = relayd_id;
168 if (relayd_id != (uint64_t) -1ULL) {
10a50311 169 ret = consumer_send_relayd_stream(stream, path);
07b86b52
JD
170 if (ret < 0) {
171 ERR("sending stream to relayd");
172 goto end_unlock;
173 }
07b86b52
JD
174 } else {
175 ret = utils_create_stream_file(path, stream->name,
10a50311
JD
176 stream->chan->tracefile_size,
177 stream->tracefile_count_current,
309167d2 178 stream->uid, stream->gid, NULL);
07b86b52
JD
179 if (ret < 0) {
180 ERR("utils_create_stream_file");
181 goto end_unlock;
182 }
183
184 stream->out_fd = ret;
185 stream->tracefile_size_current = 0;
186
81ea21bf
MD
187 DBG("Kernel consumer snapshot stream %s/%s (%" PRIu64 ")",
188 path, stream->name, stream->key);
07b86b52
JD
189 }
190
f22dd891 191 ret = kernctl_buffer_flush_empty(stream->wait_fd);
07b86b52 192 if (ret < 0) {
f22dd891
MD
193 /*
194 * Doing a buffer flush which does not take into
195 * account empty packets. This is not perfect
196 * for stream intersection, but required as a
197 * fall-back when "flush_empty" is not
198 * implemented by lttng-modules.
199 */
200 ret = kernctl_buffer_flush(stream->wait_fd);
201 if (ret < 0) {
202 ERR("Failed to flush kernel stream");
203 goto end_unlock;
204 }
07b86b52
JD
205 goto end_unlock;
206 }
207
208 ret = lttng_kconsumer_take_snapshot(stream);
209 if (ret < 0) {
210 ERR("Taking kernel snapshot");
211 goto end_unlock;
212 }
213
214 ret = lttng_kconsumer_get_produced_snapshot(stream, &produced_pos);
215 if (ret < 0) {
216 ERR("Produced kernel snapshot position");
217 goto end_unlock;
218 }
219
220 ret = lttng_kconsumer_get_consumed_snapshot(stream, &consumed_pos);
221 if (ret < 0) {
222 ERR("Consumerd kernel snapshot position");
223 goto end_unlock;
224 }
225
226 if (stream->max_sb_size == 0) {
227 ret = kernctl_get_max_subbuf_size(stream->wait_fd,
228 &stream->max_sb_size);
229 if (ret < 0) {
230 ERR("Getting kernel max_sb_size");
231 goto end_unlock;
232 }
233 }
234
d07ceecd
MD
235 consumed_pos = consumer_get_consume_start_pos(consumed_pos,
236 produced_pos, nb_packets_per_stream,
237 stream->max_sb_size);
5c786ded 238
07b86b52
JD
239 while (consumed_pos < produced_pos) {
240 ssize_t read_len;
241 unsigned long len, padded_len;
242
9ce5646a
MD
243 health_code_update();
244
07b86b52
JD
245 DBG("Kernel consumer taking snapshot at pos %lu", consumed_pos);
246
247 ret = kernctl_get_subbuf(stream->wait_fd, &consumed_pos);
248 if (ret < 0) {
32af2c95 249 if (ret != -EAGAIN) {
07b86b52
JD
250 PERROR("kernctl_get_subbuf snapshot");
251 goto end_unlock;
252 }
253 DBG("Kernel consumer get subbuf failed. Skipping it.");
254 consumed_pos += stream->max_sb_size;
ddc93ee4 255 stream->chan->lost_packets++;
07b86b52
JD
256 continue;
257 }
258
259 ret = kernctl_get_subbuf_size(stream->wait_fd, &len);
260 if (ret < 0) {
261 ERR("Snapshot kernctl_get_subbuf_size");
29decac3 262 goto error_put_subbuf;
07b86b52
JD
263 }
264
265 ret = kernctl_get_padded_subbuf_size(stream->wait_fd, &padded_len);
266 if (ret < 0) {
267 ERR("Snapshot kernctl_get_padded_subbuf_size");
29decac3 268 goto error_put_subbuf;
07b86b52
JD
269 }
270
271 read_len = lttng_consumer_on_read_subbuffer_mmap(ctx, stream, len,
309167d2 272 padded_len - len, NULL);
07b86b52 273 /*
29decac3
DG
274 * We write the padded len in local tracefiles but the data len
275 * when using a relay. Display the error but continue processing
276 * to try to release the subbuffer.
07b86b52
JD
277 */
278 if (relayd_id != (uint64_t) -1ULL) {
279 if (read_len != len) {
280 ERR("Error sending to the relay (ret: %zd != len: %lu)",
281 read_len, len);
282 }
283 } else {
284 if (read_len != padded_len) {
285 ERR("Error writing to tracefile (ret: %zd != len: %lu)",
286 read_len, padded_len);
287 }
288 }
289
290 ret = kernctl_put_subbuf(stream->wait_fd);
291 if (ret < 0) {
292 ERR("Snapshot kernctl_put_subbuf");
293 goto end_unlock;
294 }
295 consumed_pos += stream->max_sb_size;
296 }
297
298 if (relayd_id == (uint64_t) -1ULL) {
fdf9986c
MD
299 if (stream->out_fd >= 0) {
300 ret = close(stream->out_fd);
301 if (ret < 0) {
302 PERROR("Kernel consumer snapshot close out_fd");
303 goto end_unlock;
304 }
305 stream->out_fd = -1;
07b86b52 306 }
07b86b52
JD
307 } else {
308 close_relayd_stream(stream);
309 stream->net_seq_idx = (uint64_t) -1ULL;
310 }
311 pthread_mutex_unlock(&stream->lock);
312 }
313
314 /* All good! */
315 ret = 0;
316 goto end;
317
29decac3
DG
318error_put_subbuf:
319 ret = kernctl_put_subbuf(stream->wait_fd);
320 if (ret < 0) {
321 ERR("Snapshot kernctl_put_subbuf error path");
322 }
07b86b52
JD
323end_unlock:
324 pthread_mutex_unlock(&stream->lock);
325end:
326 rcu_read_unlock();
327 return ret;
328}
329
330/*
331 * Read the whole metadata available for a snapshot.
332 *
333 * Returns 0 on success, < 0 on error
334 */
335int lttng_kconsumer_snapshot_metadata(uint64_t key, char *path,
e2039c7a 336 uint64_t relayd_id, struct lttng_consumer_local_data *ctx)
07b86b52 337{
d771f832
DG
338 int ret, use_relayd = 0;
339 ssize_t ret_read;
07b86b52
JD
340 struct lttng_consumer_channel *metadata_channel;
341 struct lttng_consumer_stream *metadata_stream;
d771f832
DG
342
343 assert(ctx);
07b86b52
JD
344
345 DBG("Kernel consumer snapshot metadata with key %" PRIu64 " at path %s",
346 key, path);
347
348 rcu_read_lock();
349
350 metadata_channel = consumer_find_channel(key);
351 if (!metadata_channel) {
d771f832 352 ERR("Kernel snapshot metadata not found for key %" PRIu64, key);
07b86b52 353 ret = -1;
d771f832 354 goto error;
07b86b52
JD
355 }
356
357 metadata_stream = metadata_channel->metadata_stream;
358 assert(metadata_stream);
359
d771f832 360 /* Flag once that we have a valid relayd for the stream. */
e2039c7a 361 if (relayd_id != (uint64_t) -1ULL) {
d771f832
DG
362 use_relayd = 1;
363 }
364
365 if (use_relayd) {
10a50311 366 ret = consumer_send_relayd_stream(metadata_stream, path);
e2039c7a 367 if (ret < 0) {
d771f832 368 goto error;
e2039c7a 369 }
e2039c7a
JD
370 } else {
371 ret = utils_create_stream_file(path, metadata_stream->name,
372 metadata_stream->chan->tracefile_size,
373 metadata_stream->tracefile_count_current,
309167d2 374 metadata_stream->uid, metadata_stream->gid, NULL);
e2039c7a 375 if (ret < 0) {
d771f832 376 goto error;
e2039c7a
JD
377 }
378 metadata_stream->out_fd = ret;
07b86b52 379 }
07b86b52 380
d771f832 381 do {
9ce5646a
MD
382 health_code_update();
383
d771f832
DG
384 ret_read = lttng_kconsumer_read_subbuffer(metadata_stream, ctx);
385 if (ret_read < 0) {
56591bac 386 if (ret_read != -EAGAIN) {
6a00837f 387 ERR("Kernel snapshot reading metadata subbuffer (ret: %zd)",
d771f832
DG
388 ret_read);
389 goto error;
07b86b52 390 }
d771f832 391 /* ret_read is negative at this point so we will exit the loop. */
07b86b52
JD
392 continue;
393 }
d771f832 394 } while (ret_read >= 0);
07b86b52 395
d771f832
DG
396 if (use_relayd) {
397 close_relayd_stream(metadata_stream);
398 metadata_stream->net_seq_idx = (uint64_t) -1ULL;
399 } else {
fdf9986c
MD
400 if (metadata_stream->out_fd >= 0) {
401 ret = close(metadata_stream->out_fd);
402 if (ret < 0) {
403 PERROR("Kernel consumer snapshot metadata close out_fd");
404 /*
405 * Don't go on error here since the snapshot was successful at this
406 * point but somehow the close failed.
407 */
408 }
409 metadata_stream->out_fd = -1;
e2039c7a 410 }
e2039c7a
JD
411 }
412
07b86b52 413 ret = 0;
d771f832 414
cf53a8a6
JD
415 cds_list_del(&metadata_stream->send_node);
416 consumer_stream_destroy(metadata_stream, NULL);
417 metadata_channel->metadata_stream = NULL;
d771f832 418error:
07b86b52
JD
419 rcu_read_unlock();
420 return ret;
421}
422
1803a064
MD
423/*
424 * Receive command from session daemon and process it.
425 *
426 * Return 1 on success else a negative value or 0.
427 */
3bd1e081
MD
428int lttng_kconsumer_recv_cmd(struct lttng_consumer_local_data *ctx,
429 int sock, struct pollfd *consumer_sockpoll)
430{
431 ssize_t ret;
0c759fc9 432 enum lttcomm_return_code ret_code = LTTCOMM_CONSUMERD_SUCCESS;
3bd1e081
MD
433 struct lttcomm_consumer_msg msg;
434
9ce5646a
MD
435 health_code_update();
436
3bd1e081
MD
437 ret = lttcomm_recv_unix_sock(sock, &msg, sizeof(msg));
438 if (ret != sizeof(msg)) {
1803a064 439 if (ret > 0) {
c6857fcf 440 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_ERROR_RECV_CMD);
1803a064
MD
441 ret = -1;
442 }
3bd1e081
MD
443 return ret;
444 }
9ce5646a
MD
445
446 health_code_update();
447
84382d49
MD
448 /* Deprecated command */
449 assert(msg.cmd_type != LTTNG_CONSUMER_STOP);
3bd1e081 450
9ce5646a
MD
451 health_code_update();
452
b0b335c8
MD
453 /* relayd needs RCU read-side protection */
454 rcu_read_lock();
455
3bd1e081 456 switch (msg.cmd_type) {
00e2e675
DG
457 case LTTNG_CONSUMER_ADD_RELAYD_SOCKET:
458 {
f50f23d9 459 /* Session daemon status message are handled in the following call. */
2527bf85 460 consumer_add_relayd_socket(msg.u.relayd_sock.net_index,
7735ef9e 461 msg.u.relayd_sock.type, ctx, sock, consumer_sockpoll,
d3e2ba59 462 &msg.u.relayd_sock.sock, msg.u.relayd_sock.session_id,
2527bf85 463 msg.u.relayd_sock.relayd_session_id);
00e2e675
DG
464 goto end_nosignal;
465 }
3bd1e081
MD
466 case LTTNG_CONSUMER_ADD_CHANNEL:
467 {
468 struct lttng_consumer_channel *new_channel;
e43c41c5 469 int ret_recv;
3bd1e081 470
9ce5646a
MD
471 health_code_update();
472
f50f23d9
DG
473 /* First send a status message before receiving the fds. */
474 ret = consumer_send_status_msg(sock, ret_code);
475 if (ret < 0) {
476 /* Somehow, the session daemon is not responding anymore. */
1803a064 477 goto error_fatal;
f50f23d9 478 }
9ce5646a
MD
479
480 health_code_update();
481
d88aee68 482 DBG("consumer_add_channel %" PRIu64, msg.u.channel.channel_key);
3bd1e081 483 new_channel = consumer_allocate_channel(msg.u.channel.channel_key,
ffe60014
DG
484 msg.u.channel.session_id, msg.u.channel.pathname,
485 msg.u.channel.name, msg.u.channel.uid, msg.u.channel.gid,
1624d5b7
JD
486 msg.u.channel.relayd_id, msg.u.channel.output,
487 msg.u.channel.tracefile_size,
1950109e 488 msg.u.channel.tracefile_count, 0,
ecc48a90 489 msg.u.channel.monitor,
d7ba1388 490 msg.u.channel.live_timer_interval,
3d071855 491 NULL, NULL);
3bd1e081 492 if (new_channel == NULL) {
f73fabfd 493 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_OUTFD_ERROR);
3bd1e081
MD
494 goto end_nosignal;
495 }
ffe60014 496 new_channel->nb_init_stream_left = msg.u.channel.nb_init_streams;
95a1109b
JD
497 switch (msg.u.channel.output) {
498 case LTTNG_EVENT_SPLICE:
499 new_channel->output = CONSUMER_CHANNEL_SPLICE;
500 break;
501 case LTTNG_EVENT_MMAP:
502 new_channel->output = CONSUMER_CHANNEL_MMAP;
503 break;
504 default:
505 ERR("Channel output unknown %d", msg.u.channel.output);
506 goto end_nosignal;
507 }
ffe60014
DG
508
509 /* Translate and save channel type. */
510 switch (msg.u.channel.type) {
511 case CONSUMER_CHANNEL_TYPE_DATA:
512 case CONSUMER_CHANNEL_TYPE_METADATA:
513 new_channel->type = msg.u.channel.type;
514 break;
515 default:
516 assert(0);
517 goto end_nosignal;
518 };
519
9ce5646a
MD
520 health_code_update();
521
3bd1e081 522 if (ctx->on_recv_channel != NULL) {
e43c41c5
JD
523 ret_recv = ctx->on_recv_channel(new_channel);
524 if (ret_recv == 0) {
525 ret = consumer_add_channel(new_channel, ctx);
526 } else if (ret_recv < 0) {
3bd1e081
MD
527 goto end_nosignal;
528 }
529 } else {
e43c41c5 530 ret = consumer_add_channel(new_channel, ctx);
3bd1e081 531 }
e9404c27
JG
532 if (msg.u.channel.type == CONSUMER_CHANNEL_TYPE_DATA && !ret) {
533 int monitor_start_ret;
534
535 DBG("Consumer starting monitor timer");
94d49140
JD
536 consumer_timer_live_start(new_channel,
537 msg.u.channel.live_timer_interval);
e9404c27
JG
538 monitor_start_ret = consumer_timer_monitor_start(
539 new_channel,
540 msg.u.channel.monitor_timer_interval);
541 if (monitor_start_ret < 0) {
542 ERR("Starting channel monitoring timer failed");
543 goto end_nosignal;
544 }
545
94d49140 546 }
e43c41c5 547
9ce5646a
MD
548 health_code_update();
549
e43c41c5 550 /* If we received an error in add_channel, we need to report it. */
821fffb2 551 if (ret < 0) {
1803a064
MD
552 ret = consumer_send_status_msg(sock, ret);
553 if (ret < 0) {
554 goto error_fatal;
555 }
e43c41c5
JD
556 goto end_nosignal;
557 }
558
3bd1e081
MD
559 goto end_nosignal;
560 }
561 case LTTNG_CONSUMER_ADD_STREAM:
562 {
dae10966
DG
563 int fd;
564 struct lttng_pipe *stream_pipe;
00e2e675 565 struct lttng_consumer_stream *new_stream;
ffe60014 566 struct lttng_consumer_channel *channel;
c80048c6 567 int alloc_ret = 0;
3bd1e081 568
ffe60014
DG
569 /*
570 * Get stream's channel reference. Needed when adding the stream to the
571 * global hash table.
572 */
573 channel = consumer_find_channel(msg.u.stream.channel_key);
574 if (!channel) {
575 /*
576 * We could not find the channel. Can happen if cpu hotplug
577 * happens while tearing down.
578 */
d88aee68 579 ERR("Unable to find channel key %" PRIu64, msg.u.stream.channel_key);
e462382a 580 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
ffe60014
DG
581 }
582
9ce5646a
MD
583 health_code_update();
584
f50f23d9
DG
585 /* First send a status message before receiving the fds. */
586 ret = consumer_send_status_msg(sock, ret_code);
1803a064 587 if (ret < 0) {
d771f832 588 /* Somehow, the session daemon is not responding anymore. */
1803a064
MD
589 goto error_fatal;
590 }
9ce5646a
MD
591
592 health_code_update();
593
0c759fc9 594 if (ret_code != LTTCOMM_CONSUMERD_SUCCESS) {
d771f832 595 /* Channel was not found. */
f50f23d9
DG
596 goto end_nosignal;
597 }
598
d771f832 599 /* Blocking call */
9ce5646a
MD
600 health_poll_entry();
601 ret = lttng_consumer_poll_socket(consumer_sockpoll);
602 health_poll_exit();
84382d49
MD
603 if (ret) {
604 goto error_fatal;
3bd1e081 605 }
00e2e675 606
9ce5646a
MD
607 health_code_update();
608
00e2e675 609 /* Get stream file descriptor from socket */
f2fc6720
MD
610 ret = lttcomm_recv_fds_unix_sock(sock, &fd, 1);
611 if (ret != sizeof(fd)) {
f73fabfd 612 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_ERROR_RECV_FD);
3f8e211f 613 rcu_read_unlock();
3bd1e081
MD
614 return ret;
615 }
3bd1e081 616
9ce5646a
MD
617 health_code_update();
618
f50f23d9
DG
619 /*
620 * Send status code to session daemon only if the recv works. If the
621 * above recv() failed, the session daemon is notified through the
622 * error socket and the teardown is eventually done.
623 */
624 ret = consumer_send_status_msg(sock, ret_code);
625 if (ret < 0) {
626 /* Somehow, the session daemon is not responding anymore. */
627 goto end_nosignal;
628 }
629
9ce5646a
MD
630 health_code_update();
631
ffe60014
DG
632 new_stream = consumer_allocate_stream(channel->key,
633 fd,
634 LTTNG_CONSUMER_ACTIVE_STREAM,
635 channel->name,
636 channel->uid,
637 channel->gid,
638 channel->relayd_id,
639 channel->session_id,
640 msg.u.stream.cpu,
641 &alloc_ret,
4891ece8
DG
642 channel->type,
643 channel->monitor);
3bd1e081 644 if (new_stream == NULL) {
c80048c6
MD
645 switch (alloc_ret) {
646 case -ENOMEM:
647 case -EINVAL:
648 default:
649 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_OUTFD_ERROR);
650 break;
c80048c6 651 }
3f8e211f 652 goto end_nosignal;
3bd1e081 653 }
d771f832 654
ffe60014
DG
655 new_stream->chan = channel;
656 new_stream->wait_fd = fd;
07b86b52
JD
657 switch (channel->output) {
658 case CONSUMER_CHANNEL_SPLICE:
659 new_stream->output = LTTNG_EVENT_SPLICE;
a2361a61
JD
660 ret = utils_create_pipe(new_stream->splice_pipe);
661 if (ret < 0) {
662 goto end_nosignal;
663 }
07b86b52
JD
664 break;
665 case CONSUMER_CHANNEL_MMAP:
666 new_stream->output = LTTNG_EVENT_MMAP;
667 break;
668 default:
669 ERR("Stream output unknown %d", channel->output);
670 goto end_nosignal;
671 }
00e2e675 672
a0c83db9
DG
673 /*
674 * We've just assigned the channel to the stream so increment the
07b86b52
JD
675 * refcount right now. We don't need to increment the refcount for
676 * streams in no monitor because we handle manually the cleanup of
677 * those. It is very important to make sure there is NO prior
678 * consumer_del_stream() calls or else the refcount will be unbalanced.
a0c83db9 679 */
07b86b52
JD
680 if (channel->monitor) {
681 uatomic_inc(&new_stream->chan->refcount);
682 }
9d9353f9 683
fb3a43a9
DG
684 /*
685 * The buffer flush is done on the session daemon side for the kernel
686 * so no need for the stream "hangup_flush_done" variable to be
687 * tracked. This is important for a kernel stream since we don't rely
688 * on the flush state of the stream to read data. It's not the case for
689 * user space tracing.
690 */
691 new_stream->hangup_flush_done = 0;
692
9ce5646a
MD
693 health_code_update();
694
633d0084
DG
695 if (ctx->on_recv_stream) {
696 ret = ctx->on_recv_stream(new_stream);
697 if (ret < 0) {
d771f832 698 consumer_stream_free(new_stream);
633d0084 699 goto end_nosignal;
fb3a43a9 700 }
633d0084 701 }
fb3a43a9 702
9ce5646a
MD
703 health_code_update();
704
07b86b52
JD
705 if (new_stream->metadata_flag) {
706 channel->metadata_stream = new_stream;
707 }
708
2bba9e53
DG
709 /* Do not monitor this stream. */
710 if (!channel->monitor) {
5eecee74 711 DBG("Kernel consumer add stream %s in no monitor mode with "
6dc3064a 712 "relayd id %" PRIu64, new_stream->name,
5eecee74 713 new_stream->net_seq_idx);
10a50311 714 cds_list_add(&new_stream->send_node, &channel->streams.head);
6dc3064a
DG
715 break;
716 }
717
e1b71bdc
DG
718 /* Send stream to relayd if the stream has an ID. */
719 if (new_stream->net_seq_idx != (uint64_t) -1ULL) {
194ee077
DG
720 ret = consumer_send_relayd_stream(new_stream,
721 new_stream->chan->pathname);
e1b71bdc
DG
722 if (ret < 0) {
723 consumer_stream_free(new_stream);
724 goto end_nosignal;
725 }
001b7e62
MD
726
727 /*
728 * If adding an extra stream to an already
729 * existing channel (e.g. cpu hotplug), we need
730 * to send the "streams_sent" command to relayd.
731 */
732 if (channel->streams_sent_to_relayd) {
733 ret = consumer_send_relayd_streams_sent(
734 new_stream->net_seq_idx);
735 if (ret < 0) {
736 goto end_nosignal;
737 }
738 }
e2039c7a
JD
739 }
740
50f8ae69 741 /* Get the right pipe where the stream will be sent. */
633d0084 742 if (new_stream->metadata_flag) {
66d583dc 743 consumer_add_metadata_stream(new_stream);
dae10966 744 stream_pipe = ctx->consumer_metadata_pipe;
3bd1e081 745 } else {
66d583dc 746 consumer_add_data_stream(new_stream);
dae10966 747 stream_pipe = ctx->consumer_data_pipe;
50f8ae69
DG
748 }
749
66d583dc 750 /* Visible to other threads */
5ab66908
MD
751 new_stream->globally_visible = 1;
752
9ce5646a
MD
753 health_code_update();
754
dae10966 755 ret = lttng_pipe_write(stream_pipe, &new_stream, sizeof(new_stream));
50f8ae69 756 if (ret < 0) {
dae10966 757 ERR("Consumer write %s stream to pipe %d",
50f8ae69 758 new_stream->metadata_flag ? "metadata" : "data",
dae10966 759 lttng_pipe_get_writefd(stream_pipe));
5ab66908
MD
760 if (new_stream->metadata_flag) {
761 consumer_del_stream_for_metadata(new_stream);
762 } else {
763 consumer_del_stream_for_data(new_stream);
764 }
50f8ae69 765 goto end_nosignal;
3bd1e081 766 }
00e2e675 767
50f8ae69 768 DBG("Kernel consumer ADD_STREAM %s (fd: %d) with relayd id %" PRIu64,
ffe60014 769 new_stream->name, fd, new_stream->relayd_stream_id);
3bd1e081
MD
770 break;
771 }
a4baae1b
JD
772 case LTTNG_CONSUMER_STREAMS_SENT:
773 {
774 struct lttng_consumer_channel *channel;
775
776 /*
777 * Get stream's channel reference. Needed when adding the stream to the
778 * global hash table.
779 */
780 channel = consumer_find_channel(msg.u.sent_streams.channel_key);
781 if (!channel) {
782 /*
783 * We could not find the channel. Can happen if cpu hotplug
784 * happens while tearing down.
785 */
786 ERR("Unable to find channel key %" PRIu64,
787 msg.u.sent_streams.channel_key);
e462382a 788 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
a4baae1b
JD
789 }
790
791 health_code_update();
792
793 /*
794 * Send status code to session daemon.
795 */
796 ret = consumer_send_status_msg(sock, ret_code);
f261ad0a 797 if (ret < 0 || ret_code != LTTCOMM_CONSUMERD_SUCCESS) {
a4baae1b
JD
798 /* Somehow, the session daemon is not responding anymore. */
799 goto end_nosignal;
800 }
801
802 health_code_update();
803
804 /*
805 * We should not send this message if we don't monitor the
806 * streams in this channel.
807 */
808 if (!channel->monitor) {
809 break;
810 }
811
812 health_code_update();
813 /* Send stream to relayd if the stream has an ID. */
814 if (msg.u.sent_streams.net_seq_idx != (uint64_t) -1ULL) {
815 ret = consumer_send_relayd_streams_sent(
816 msg.u.sent_streams.net_seq_idx);
817 if (ret < 0) {
818 goto end_nosignal;
819 }
001b7e62 820 channel->streams_sent_to_relayd = true;
a4baae1b
JD
821 }
822 break;
823 }
3bd1e081
MD
824 case LTTNG_CONSUMER_UPDATE_STREAM:
825 {
3f8e211f
DG
826 rcu_read_unlock();
827 return -ENOSYS;
828 }
829 case LTTNG_CONSUMER_DESTROY_RELAYD:
830 {
a6ba4fe1 831 uint64_t index = msg.u.destroy_relayd.net_seq_idx;
3f8e211f
DG
832 struct consumer_relayd_sock_pair *relayd;
833
a6ba4fe1 834 DBG("Kernel consumer destroying relayd %" PRIu64, index);
3f8e211f
DG
835
836 /* Get relayd reference if exists. */
a6ba4fe1 837 relayd = consumer_find_relayd(index);
3f8e211f 838 if (relayd == NULL) {
3448e266 839 DBG("Unable to find relayd %" PRIu64, index);
e462382a 840 ret_code = LTTCOMM_CONSUMERD_RELAYD_FAIL;
3bd1e081 841 }
3f8e211f 842
a6ba4fe1
DG
843 /*
844 * Each relayd socket pair has a refcount of stream attached to it
845 * which tells if the relayd is still active or not depending on the
846 * refcount value.
847 *
848 * This will set the destroy flag of the relayd object and destroy it
849 * if the refcount reaches zero when called.
850 *
851 * The destroy can happen either here or when a stream fd hangs up.
852 */
f50f23d9
DG
853 if (relayd) {
854 consumer_flag_relayd_for_destroy(relayd);
855 }
856
9ce5646a
MD
857 health_code_update();
858
f50f23d9
DG
859 ret = consumer_send_status_msg(sock, ret_code);
860 if (ret < 0) {
861 /* Somehow, the session daemon is not responding anymore. */
1803a064 862 goto error_fatal;
f50f23d9 863 }
3f8e211f 864
3f8e211f 865 goto end_nosignal;
3bd1e081 866 }
6d805429 867 case LTTNG_CONSUMER_DATA_PENDING:
53632229 868 {
c8f59ee5 869 int32_t ret;
6d805429 870 uint64_t id = msg.u.data_pending.session_id;
c8f59ee5 871
6d805429 872 DBG("Kernel consumer data pending command for id %" PRIu64, id);
c8f59ee5 873
6d805429 874 ret = consumer_data_pending(id);
c8f59ee5 875
9ce5646a
MD
876 health_code_update();
877
c8f59ee5
DG
878 /* Send back returned value to session daemon */
879 ret = lttcomm_send_unix_sock(sock, &ret, sizeof(ret));
880 if (ret < 0) {
6d805429 881 PERROR("send data pending ret code");
1803a064 882 goto error_fatal;
c8f59ee5 883 }
f50f23d9
DG
884
885 /*
886 * No need to send back a status message since the data pending
887 * returned value is the response.
888 */
c8f59ee5 889 break;
53632229 890 }
6dc3064a
DG
891 case LTTNG_CONSUMER_SNAPSHOT_CHANNEL:
892 {
07b86b52
JD
893 if (msg.u.snapshot_channel.metadata == 1) {
894 ret = lttng_kconsumer_snapshot_metadata(msg.u.snapshot_channel.key,
e2039c7a
JD
895 msg.u.snapshot_channel.pathname,
896 msg.u.snapshot_channel.relayd_id, ctx);
07b86b52
JD
897 if (ret < 0) {
898 ERR("Snapshot metadata failed");
e462382a 899 ret_code = LTTCOMM_CONSUMERD_ERROR_METADATA;
07b86b52
JD
900 }
901 } else {
902 ret = lttng_kconsumer_snapshot_channel(msg.u.snapshot_channel.key,
903 msg.u.snapshot_channel.pathname,
5c786ded 904 msg.u.snapshot_channel.relayd_id,
d07ceecd 905 msg.u.snapshot_channel.nb_packets_per_stream,
5c786ded 906 ctx);
07b86b52
JD
907 if (ret < 0) {
908 ERR("Snapshot channel failed");
e462382a 909 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
07b86b52
JD
910 }
911 }
912
9ce5646a
MD
913 health_code_update();
914
6dc3064a
DG
915 ret = consumer_send_status_msg(sock, ret_code);
916 if (ret < 0) {
917 /* Somehow, the session daemon is not responding anymore. */
918 goto end_nosignal;
919 }
920 break;
921 }
07b86b52
JD
922 case LTTNG_CONSUMER_DESTROY_CHANNEL:
923 {
924 uint64_t key = msg.u.destroy_channel.key;
925 struct lttng_consumer_channel *channel;
926
927 channel = consumer_find_channel(key);
928 if (!channel) {
929 ERR("Kernel consumer destroy channel %" PRIu64 " not found", key);
e462382a 930 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
07b86b52
JD
931 }
932
9ce5646a
MD
933 health_code_update();
934
07b86b52
JD
935 ret = consumer_send_status_msg(sock, ret_code);
936 if (ret < 0) {
937 /* Somehow, the session daemon is not responding anymore. */
938 goto end_nosignal;
939 }
940
9ce5646a
MD
941 health_code_update();
942
15dc512a
DG
943 /* Stop right now if no channel was found. */
944 if (!channel) {
945 goto end_nosignal;
946 }
947
07b86b52
JD
948 /*
949 * This command should ONLY be issued for channel with streams set in
950 * no monitor mode.
951 */
952 assert(!channel->monitor);
953
954 /*
955 * The refcount should ALWAYS be 0 in the case of a channel in no
956 * monitor mode.
957 */
958 assert(!uatomic_sub_return(&channel->refcount, 1));
959
960 consumer_del_channel(channel);
961
962 goto end_nosignal;
963 }
fb83fe64
JD
964 case LTTNG_CONSUMER_DISCARDED_EVENTS:
965 {
66ab32be
JD
966 ssize_t ret;
967 uint64_t count;
fb83fe64
JD
968 struct lttng_consumer_channel *channel;
969 uint64_t id = msg.u.discarded_events.session_id;
970 uint64_t key = msg.u.discarded_events.channel_key;
971
e5742757
MD
972 DBG("Kernel consumer discarded events command for session id %"
973 PRIu64 ", channel key %" PRIu64, id, key);
974
fb83fe64
JD
975 channel = consumer_find_channel(key);
976 if (!channel) {
977 ERR("Kernel consumer discarded events channel %"
978 PRIu64 " not found", key);
66ab32be 979 count = 0;
e5742757 980 } else {
66ab32be 981 count = channel->discarded_events;
fb83fe64
JD
982 }
983
fb83fe64
JD
984 health_code_update();
985
986 /* Send back returned value to session daemon */
66ab32be 987 ret = lttcomm_send_unix_sock(sock, &count, sizeof(count));
fb83fe64
JD
988 if (ret < 0) {
989 PERROR("send discarded events");
990 goto error_fatal;
991 }
992
993 break;
994 }
995 case LTTNG_CONSUMER_LOST_PACKETS:
996 {
66ab32be
JD
997 ssize_t ret;
998 uint64_t count;
fb83fe64
JD
999 struct lttng_consumer_channel *channel;
1000 uint64_t id = msg.u.lost_packets.session_id;
1001 uint64_t key = msg.u.lost_packets.channel_key;
1002
e5742757
MD
1003 DBG("Kernel consumer lost packets command for session id %"
1004 PRIu64 ", channel key %" PRIu64, id, key);
1005
fb83fe64
JD
1006 channel = consumer_find_channel(key);
1007 if (!channel) {
1008 ERR("Kernel consumer lost packets channel %"
1009 PRIu64 " not found", key);
66ab32be 1010 count = 0;
e5742757 1011 } else {
66ab32be 1012 count = channel->lost_packets;
fb83fe64
JD
1013 }
1014
fb83fe64
JD
1015 health_code_update();
1016
1017 /* Send back returned value to session daemon */
66ab32be 1018 ret = lttcomm_send_unix_sock(sock, &count, sizeof(count));
fb83fe64
JD
1019 if (ret < 0) {
1020 PERROR("send lost packets");
1021 goto error_fatal;
1022 }
1023
1024 break;
1025 }
b3530820
JG
1026 case LTTNG_CONSUMER_SET_CHANNEL_MONITOR_PIPE:
1027 {
1028 int channel_monitor_pipe;
1029
1030 ret_code = LTTCOMM_CONSUMERD_SUCCESS;
1031 /* Successfully received the command's type. */
1032 ret = consumer_send_status_msg(sock, ret_code);
1033 if (ret < 0) {
1034 goto error_fatal;
1035 }
1036
1037 ret = lttcomm_recv_fds_unix_sock(sock, &channel_monitor_pipe,
1038 1);
1039 if (ret != sizeof(channel_monitor_pipe)) {
1040 ERR("Failed to receive channel monitor pipe");
1041 goto error_fatal;
1042 }
1043
1044 DBG("Received channel monitor pipe (%d)", channel_monitor_pipe);
1045 ret = consumer_timer_thread_set_channel_monitor_pipe(
1046 channel_monitor_pipe);
1047 if (!ret) {
1048 int flags;
1049
1050 ret_code = LTTCOMM_CONSUMERD_SUCCESS;
1051 /* Set the pipe as non-blocking. */
1052 ret = fcntl(channel_monitor_pipe, F_GETFL, 0);
1053 if (ret == -1) {
1054 PERROR("fcntl get flags of the channel monitoring pipe");
1055 goto error_fatal;
1056 }
1057 flags = ret;
1058
1059 ret = fcntl(channel_monitor_pipe, F_SETFL,
1060 flags | O_NONBLOCK);
1061 if (ret == -1) {
1062 PERROR("fcntl set O_NONBLOCK flag of the channel monitoring pipe");
1063 goto error_fatal;
1064 }
1065 DBG("Channel monitor pipe set as non-blocking");
1066 } else {
1067 ret_code = LTTCOMM_CONSUMERD_ALREADY_SET;
1068 }
1069 ret = consumer_send_status_msg(sock, ret_code);
1070 if (ret < 0) {
1071 goto error_fatal;
1072 }
1073 break;
1074 }
3bd1e081 1075 default:
3f8e211f 1076 goto end_nosignal;
3bd1e081 1077 }
3f8e211f 1078
3bd1e081 1079end_nosignal:
b0b335c8 1080 rcu_read_unlock();
4cbc1a04
DG
1081
1082 /*
1083 * Return 1 to indicate success since the 0 value can be a socket
1084 * shutdown during the recv() or send() call.
1085 */
9ce5646a 1086 health_code_update();
4cbc1a04 1087 return 1;
1803a064
MD
1088
1089error_fatal:
1090 rcu_read_unlock();
1091 /* This will issue a consumer stop. */
1092 return -1;
3bd1e081 1093}
d41f73b7 1094
309167d2
JD
1095/*
1096 * Populate index values of a kernel stream. Values are set in big endian order.
1097 *
1098 * Return 0 on success or else a negative value.
1099 */
50adc264 1100static int get_index_values(struct ctf_packet_index *index, int infd)
309167d2
JD
1101{
1102 int ret;
1103
1104 ret = kernctl_get_timestamp_begin(infd, &index->timestamp_begin);
1105 if (ret < 0) {
1106 PERROR("kernctl_get_timestamp_begin");
1107 goto error;
1108 }
1109 index->timestamp_begin = htobe64(index->timestamp_begin);
1110
1111 ret = kernctl_get_timestamp_end(infd, &index->timestamp_end);
1112 if (ret < 0) {
1113 PERROR("kernctl_get_timestamp_end");
1114 goto error;
1115 }
1116 index->timestamp_end = htobe64(index->timestamp_end);
1117
1118 ret = kernctl_get_events_discarded(infd, &index->events_discarded);
1119 if (ret < 0) {
1120 PERROR("kernctl_get_events_discarded");
1121 goto error;
1122 }
1123 index->events_discarded = htobe64(index->events_discarded);
1124
1125 ret = kernctl_get_content_size(infd, &index->content_size);
1126 if (ret < 0) {
1127 PERROR("kernctl_get_content_size");
1128 goto error;
1129 }
1130 index->content_size = htobe64(index->content_size);
1131
1132 ret = kernctl_get_packet_size(infd, &index->packet_size);
1133 if (ret < 0) {
1134 PERROR("kernctl_get_packet_size");
1135 goto error;
1136 }
1137 index->packet_size = htobe64(index->packet_size);
1138
1139 ret = kernctl_get_stream_id(infd, &index->stream_id);
1140 if (ret < 0) {
1141 PERROR("kernctl_get_stream_id");
1142 goto error;
1143 }
1144 index->stream_id = htobe64(index->stream_id);
1145
234cd636
JD
1146 ret = kernctl_get_instance_id(infd, &index->stream_instance_id);
1147 if (ret < 0) {
f0b03c22
MD
1148 if (ret == -ENOTTY) {
1149 /* Command not implemented by lttng-modules. */
1150 index->stream_instance_id = -1ULL;
f0b03c22
MD
1151 } else {
1152 PERROR("kernctl_get_instance_id");
1153 goto error;
1154 }
234cd636
JD
1155 }
1156 index->stream_instance_id = htobe64(index->stream_instance_id);
1157
1158 ret = kernctl_get_sequence_number(infd, &index->packet_seq_num);
1159 if (ret < 0) {
f0b03c22
MD
1160 if (ret == -ENOTTY) {
1161 /* Command not implemented by lttng-modules. */
1162 index->packet_seq_num = -1ULL;
1163 ret = 0;
1164 } else {
1165 PERROR("kernctl_get_sequence_number");
1166 goto error;
1167 }
234cd636
JD
1168 }
1169 index->packet_seq_num = htobe64(index->packet_seq_num);
1170
309167d2
JD
1171error:
1172 return ret;
1173}
94d49140
JD
1174/*
1175 * Sync metadata meaning request them to the session daemon and snapshot to the
1176 * metadata thread can consumer them.
1177 *
1178 * Metadata stream lock MUST be acquired.
1179 *
1180 * Return 0 if new metadatda is available, EAGAIN if the metadata stream
1181 * is empty or a negative value on error.
1182 */
1183int lttng_kconsumer_sync_metadata(struct lttng_consumer_stream *metadata)
1184{
1185 int ret;
1186
1187 assert(metadata);
1188
1189 ret = kernctl_buffer_flush(metadata->wait_fd);
1190 if (ret < 0) {
1191 ERR("Failed to flush kernel stream");
1192 goto end;
1193 }
1194
1195 ret = kernctl_snapshot(metadata->wait_fd);
1196 if (ret < 0) {
32af2c95 1197 if (ret != -EAGAIN) {
94d49140
JD
1198 ERR("Sync metadata, taking kernel snapshot failed.");
1199 goto end;
1200 }
1201 DBG("Sync metadata, no new kernel metadata");
1202 /* No new metadata, exit. */
1203 ret = ENODATA;
1204 goto end;
1205 }
1206
1207end:
1208 return ret;
1209}
309167d2 1210
fb83fe64
JD
1211static
1212int update_stream_stats(struct lttng_consumer_stream *stream)
1213{
1214 int ret;
1215 uint64_t seq, discarded;
1216
1217 ret = kernctl_get_sequence_number(stream->wait_fd, &seq);
1218 if (ret < 0) {
f0b03c22
MD
1219 if (ret == -ENOTTY) {
1220 /* Command not implemented by lttng-modules. */
1221 seq = -1ULL;
f0b03c22
MD
1222 } else {
1223 PERROR("kernctl_get_sequence_number");
1224 goto end;
1225 }
fb83fe64
JD
1226 }
1227
1228 /*
1229 * Start the sequence when we extract the first packet in case we don't
1230 * start at 0 (for example if a consumer is not connected to the
1231 * session immediately after the beginning).
1232 */
1233 if (stream->last_sequence_number == -1ULL) {
1234 stream->last_sequence_number = seq;
1235 } else if (seq > stream->last_sequence_number) {
1236 stream->chan->lost_packets += seq -
1237 stream->last_sequence_number - 1;
1238 } else {
1239 /* seq <= last_sequence_number */
1240 ERR("Sequence number inconsistent : prev = %" PRIu64
1241 ", current = %" PRIu64,
1242 stream->last_sequence_number, seq);
1243 ret = -1;
1244 goto end;
1245 }
1246 stream->last_sequence_number = seq;
1247
1248 ret = kernctl_get_events_discarded(stream->wait_fd, &discarded);
1249 if (ret < 0) {
1250 PERROR("kernctl_get_events_discarded");
1251 goto end;
1252 }
1253 if (discarded < stream->last_discarded_events) {
1254 /*
83f4233d
MJ
1255 * Overflow has occurred. We assume only one wrap-around
1256 * has occurred.
fb83fe64
JD
1257 */
1258 stream->chan->discarded_events += (1ULL << (CAA_BITS_PER_LONG - 1)) -
1259 stream->last_discarded_events + discarded;
1260 } else {
1261 stream->chan->discarded_events += discarded -
1262 stream->last_discarded_events;
1263 }
1264 stream->last_discarded_events = discarded;
1265 ret = 0;
1266
1267end:
1268 return ret;
1269}
1270
93ec662e
JD
1271/*
1272 * Check if the local version of the metadata stream matches with the version
1273 * of the metadata stream in the kernel. If it was updated, set the reset flag
1274 * on the stream.
1275 */
1276static
1277int metadata_stream_check_version(int infd, struct lttng_consumer_stream *stream)
1278{
1279 int ret;
1280 uint64_t cur_version;
1281
1282 ret = kernctl_get_metadata_version(infd, &cur_version);
1283 if (ret < 0) {
f0b03c22
MD
1284 if (ret == -ENOTTY) {
1285 /*
1286 * LTTng-modules does not implement this
1287 * command.
1288 */
1289 ret = 0;
1290 goto end;
1291 }
93ec662e
JD
1292 ERR("Failed to get the metadata version");
1293 goto end;
1294 }
1295
1296 if (stream->metadata_version == cur_version) {
1297 ret = 0;
1298 goto end;
1299 }
1300
1301 DBG("New metadata version detected");
1302 stream->metadata_version = cur_version;
1303 stream->reset_metadata_flag = 1;
1304 ret = 0;
1305
1306end:
1307 return ret;
1308}
1309
d41f73b7
MD
1310/*
1311 * Consume data on a file descriptor and write it on a trace file.
1312 */
4078b776 1313ssize_t lttng_kconsumer_read_subbuffer(struct lttng_consumer_stream *stream,
d41f73b7
MD
1314 struct lttng_consumer_local_data *ctx)
1315{
1d4dfdef 1316 unsigned long len, subbuf_size, padding;
1c20f0e2 1317 int err, write_index = 1;
4078b776 1318 ssize_t ret = 0;
d41f73b7 1319 int infd = stream->wait_fd;
50adc264 1320 struct ctf_packet_index index;
d41f73b7
MD
1321
1322 DBG("In read_subbuffer (infd : %d)", infd);
309167d2 1323
d41f73b7
MD
1324 /* Get the next subbuffer */
1325 err = kernctl_get_next_subbuf(infd);
1326 if (err != 0) {
d41f73b7
MD
1327 /*
1328 * This is a debug message even for single-threaded consumer,
1329 * because poll() have more relaxed criterions than get subbuf,
1330 * so get_subbuf may fail for short race windows where poll()
1331 * would issue wakeups.
1332 */
1333 DBG("Reserving sub buffer failed (everything is normal, "
1334 "it is due to concurrency)");
32af2c95 1335 ret = err;
d41f73b7
MD
1336 goto end;
1337 }
1338
1d4dfdef
DG
1339 /* Get the full subbuffer size including padding */
1340 err = kernctl_get_padded_subbuf_size(infd, &len);
1341 if (err != 0) {
5a510c9f 1342 PERROR("Getting sub-buffer len failed.");
8265f19e
MD
1343 err = kernctl_put_subbuf(infd);
1344 if (err != 0) {
32af2c95 1345 if (err == -EFAULT) {
5a510c9f 1346 PERROR("Error in unreserving sub buffer\n");
32af2c95 1347 } else if (err == -EIO) {
8265f19e 1348 /* Should never happen with newer LTTng versions */
5a510c9f 1349 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
8265f19e 1350 }
32af2c95 1351 ret = err;
8265f19e
MD
1352 goto end;
1353 }
32af2c95 1354 ret = err;
1d4dfdef
DG
1355 goto end;
1356 }
1357
1c20f0e2 1358 if (!stream->metadata_flag) {
309167d2
JD
1359 ret = get_index_values(&index, infd);
1360 if (ret < 0) {
8265f19e
MD
1361 err = kernctl_put_subbuf(infd);
1362 if (err != 0) {
32af2c95 1363 if (err == -EFAULT) {
5a510c9f 1364 PERROR("Error in unreserving sub buffer\n");
32af2c95 1365 } else if (err == -EIO) {
8265f19e 1366 /* Should never happen with newer LTTng versions */
5a510c9f 1367 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
8265f19e 1368 }
32af2c95 1369 ret = err;
8265f19e
MD
1370 goto end;
1371 }
309167d2
JD
1372 goto end;
1373 }
fb83fe64
JD
1374 ret = update_stream_stats(stream);
1375 if (ret < 0) {
7b87473d
MD
1376 err = kernctl_put_subbuf(infd);
1377 if (err != 0) {
1378 if (err == -EFAULT) {
1379 PERROR("Error in unreserving sub buffer\n");
1380 } else if (err == -EIO) {
1381 /* Should never happen with newer LTTng versions */
1382 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
1383 }
1384 ret = err;
1385 goto end;
1386 }
fb83fe64
JD
1387 goto end;
1388 }
1c20f0e2
JD
1389 } else {
1390 write_index = 0;
93ec662e
JD
1391 ret = metadata_stream_check_version(infd, stream);
1392 if (ret < 0) {
7b87473d
MD
1393 err = kernctl_put_subbuf(infd);
1394 if (err != 0) {
1395 if (err == -EFAULT) {
1396 PERROR("Error in unreserving sub buffer\n");
1397 } else if (err == -EIO) {
1398 /* Should never happen with newer LTTng versions */
1399 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
1400 }
1401 ret = err;
1402 goto end;
1403 }
93ec662e
JD
1404 goto end;
1405 }
309167d2
JD
1406 }
1407
ffe60014 1408 switch (stream->chan->output) {
07b86b52 1409 case CONSUMER_CHANNEL_SPLICE:
1d4dfdef
DG
1410 /*
1411 * XXX: The lttng-modules splice "actor" does not handle copying
1412 * partial pages hence only using the subbuffer size without the
1413 * padding makes the splice fail.
1414 */
1415 subbuf_size = len;
1416 padding = 0;
1417
1418 /* splice the subbuffer to the tracefile */
91dfef6e 1419 ret = lttng_consumer_on_read_subbuffer_splice(ctx, stream, subbuf_size,
309167d2 1420 padding, &index);
91dfef6e
DG
1421 /*
1422 * XXX: Splice does not support network streaming so the return value
1423 * is simply checked against subbuf_size and not like the mmap() op.
1424 */
1d4dfdef
DG
1425 if (ret != subbuf_size) {
1426 /*
1427 * display the error but continue processing to try
1428 * to release the subbuffer
1429 */
1430 ERR("Error splicing to tracefile (ret: %zd != len: %lu)",
1431 ret, subbuf_size);
309167d2 1432 write_index = 0;
1d4dfdef
DG
1433 }
1434 break;
07b86b52 1435 case CONSUMER_CHANNEL_MMAP:
1d4dfdef
DG
1436 /* Get subbuffer size without padding */
1437 err = kernctl_get_subbuf_size(infd, &subbuf_size);
1438 if (err != 0) {
5a510c9f 1439 PERROR("Getting sub-buffer len failed.");
8265f19e
MD
1440 err = kernctl_put_subbuf(infd);
1441 if (err != 0) {
32af2c95 1442 if (err == -EFAULT) {
5a510c9f 1443 PERROR("Error in unreserving sub buffer\n");
32af2c95 1444 } else if (err == -EIO) {
8265f19e 1445 /* Should never happen with newer LTTng versions */
5a510c9f 1446 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
8265f19e 1447 }
32af2c95 1448 ret = err;
8265f19e
MD
1449 goto end;
1450 }
32af2c95 1451 ret = err;
1d4dfdef
DG
1452 goto end;
1453 }
47e81c02 1454
1d4dfdef
DG
1455 /* Make sure the tracer is not gone mad on us! */
1456 assert(len >= subbuf_size);
1457
1458 padding = len - subbuf_size;
1459
1460 /* write the subbuffer to the tracefile */
91dfef6e 1461 ret = lttng_consumer_on_read_subbuffer_mmap(ctx, stream, subbuf_size,
309167d2 1462 padding, &index);
91dfef6e
DG
1463 /*
1464 * The mmap operation should write subbuf_size amount of data when
1465 * network streaming or the full padding (len) size when we are _not_
1466 * streaming.
1467 */
d88aee68
DG
1468 if ((ret != subbuf_size && stream->net_seq_idx != (uint64_t) -1ULL) ||
1469 (ret != len && stream->net_seq_idx == (uint64_t) -1ULL)) {
1d4dfdef 1470 /*
91dfef6e 1471 * Display the error but continue processing to try to release the
2336629e
DG
1472 * subbuffer. This is a DBG statement since this is possible to
1473 * happen without being a critical error.
1d4dfdef 1474 */
2336629e 1475 DBG("Error writing to tracefile "
91dfef6e
DG
1476 "(ret: %zd != len: %lu != subbuf_size: %lu)",
1477 ret, len, subbuf_size);
309167d2 1478 write_index = 0;
1d4dfdef
DG
1479 }
1480 break;
1481 default:
1482 ERR("Unknown output method");
56591bac 1483 ret = -EPERM;
d41f73b7
MD
1484 }
1485
1486 err = kernctl_put_next_subbuf(infd);
1487 if (err != 0) {
32af2c95 1488 if (err == -EFAULT) {
5a510c9f 1489 PERROR("Error in unreserving sub buffer\n");
32af2c95 1490 } else if (err == -EIO) {
d41f73b7 1491 /* Should never happen with newer LTTng versions */
5a510c9f 1492 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
d41f73b7 1493 }
32af2c95 1494 ret = err;
d41f73b7
MD
1495 goto end;
1496 }
1497
309167d2 1498 /* Write index if needed. */
1c20f0e2
JD
1499 if (!write_index) {
1500 goto end;
1501 }
1502
94d49140
JD
1503 if (stream->chan->live_timer_interval && !stream->metadata_flag) {
1504 /*
1505 * In live, block until all the metadata is sent.
1506 */
c585821b
MD
1507 pthread_mutex_lock(&stream->metadata_timer_lock);
1508 assert(!stream->missed_metadata_flush);
1509 stream->waiting_on_metadata = true;
1510 pthread_mutex_unlock(&stream->metadata_timer_lock);
1511
94d49140 1512 err = consumer_stream_sync_metadata(ctx, stream->session_id);
c585821b
MD
1513
1514 pthread_mutex_lock(&stream->metadata_timer_lock);
1515 stream->waiting_on_metadata = false;
1516 if (stream->missed_metadata_flush) {
1517 stream->missed_metadata_flush = false;
1518 pthread_mutex_unlock(&stream->metadata_timer_lock);
1519 (void) consumer_flush_kernel_index(stream);
1520 } else {
1521 pthread_mutex_unlock(&stream->metadata_timer_lock);
1522 }
94d49140
JD
1523 if (err < 0) {
1524 goto end;
1525 }
1526 }
1527
1c20f0e2
JD
1528 err = consumer_stream_write_index(stream, &index);
1529 if (err < 0) {
1530 goto end;
309167d2
JD
1531 }
1532
d41f73b7
MD
1533end:
1534 return ret;
1535}
1536
1537int lttng_kconsumer_on_recv_stream(struct lttng_consumer_stream *stream)
1538{
1539 int ret;
ffe60014
DG
1540
1541 assert(stream);
1542
2bba9e53
DG
1543 /*
1544 * Don't create anything if this is set for streaming or should not be
1545 * monitored.
1546 */
1547 if (stream->net_seq_idx == (uint64_t) -1ULL && stream->chan->monitor) {
fe4477ee
JD
1548 ret = utils_create_stream_file(stream->chan->pathname, stream->name,
1549 stream->chan->tracefile_size, stream->tracefile_count_current,
309167d2 1550 stream->uid, stream->gid, NULL);
fe4477ee
JD
1551 if (ret < 0) {
1552 goto error;
1553 }
1554 stream->out_fd = ret;
1555 stream->tracefile_size_current = 0;
309167d2
JD
1556
1557 if (!stream->metadata_flag) {
f8f3885c
MD
1558 struct lttng_index_file *index_file;
1559
1560 index_file = lttng_index_file_create(stream->chan->pathname,
309167d2
JD
1561 stream->name, stream->uid, stream->gid,
1562 stream->chan->tracefile_size,
f8f3885c
MD
1563 stream->tracefile_count_current,
1564 CTF_INDEX_MAJOR, CTF_INDEX_MINOR);
1565 if (!index_file) {
309167d2
JD
1566 goto error;
1567 }
1b47ae58 1568 assert(!stream->index_file);
f8f3885c 1569 stream->index_file = index_file;
309167d2 1570 }
ffe60014 1571 }
d41f73b7 1572
d41f73b7
MD
1573 if (stream->output == LTTNG_EVENT_MMAP) {
1574 /* get the len of the mmap region */
1575 unsigned long mmap_len;
1576
1577 ret = kernctl_get_mmap_len(stream->wait_fd, &mmap_len);
1578 if (ret != 0) {
ffe60014 1579 PERROR("kernctl_get_mmap_len");
d41f73b7
MD
1580 goto error_close_fd;
1581 }
1582 stream->mmap_len = (size_t) mmap_len;
1583
ffe60014
DG
1584 stream->mmap_base = mmap(NULL, stream->mmap_len, PROT_READ,
1585 MAP_PRIVATE, stream->wait_fd, 0);
d41f73b7 1586 if (stream->mmap_base == MAP_FAILED) {
ffe60014 1587 PERROR("Error mmaping");
d41f73b7
MD
1588 ret = -1;
1589 goto error_close_fd;
1590 }
1591 }
1592
1593 /* we return 0 to let the library handle the FD internally */
1594 return 0;
1595
1596error_close_fd:
2f225ce2 1597 if (stream->out_fd >= 0) {
d41f73b7
MD
1598 int err;
1599
1600 err = close(stream->out_fd);
1601 assert(!err);
2f225ce2 1602 stream->out_fd = -1;
d41f73b7
MD
1603 }
1604error:
1605 return ret;
1606}
1607
ca22feea
DG
1608/*
1609 * Check if data is still being extracted from the buffers for a specific
4e9a4686
DG
1610 * stream. Consumer data lock MUST be acquired before calling this function
1611 * and the stream lock.
ca22feea 1612 *
6d805429 1613 * Return 1 if the traced data are still getting read else 0 meaning that the
ca22feea
DG
1614 * data is available for trace viewer reading.
1615 */
6d805429 1616int lttng_kconsumer_data_pending(struct lttng_consumer_stream *stream)
ca22feea
DG
1617{
1618 int ret;
1619
1620 assert(stream);
1621
873b9e9a
MD
1622 if (stream->endpoint_status != CONSUMER_ENDPOINT_ACTIVE) {
1623 ret = 0;
1624 goto end;
1625 }
1626
ca22feea
DG
1627 ret = kernctl_get_next_subbuf(stream->wait_fd);
1628 if (ret == 0) {
1629 /* There is still data so let's put back this subbuffer. */
1630 ret = kernctl_put_subbuf(stream->wait_fd);
1631 assert(ret == 0);
6d805429 1632 ret = 1; /* Data is pending */
4e9a4686 1633 goto end;
ca22feea
DG
1634 }
1635
6d805429
DG
1636 /* Data is NOT pending and ready to be read. */
1637 ret = 0;
ca22feea 1638
6efae65e
DG
1639end:
1640 return ret;
ca22feea 1641}
This page took 0.152905 seconds and 5 git commands to generate.