consumerd: tag metadata channel as being part of a live session
[lttng-tools.git] / src / common / kernel-consumer / kernel-consumer.c
CommitLineData
3bd1e081
MD
1/*
2 * Copyright (C) 2011 - Julien Desfossez <julien.desfossez@polymtl.ca>
3 * Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
4 *
d14d33bf
AM
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License, version 2 only,
7 * as published by the Free Software Foundation.
3bd1e081
MD
8 *
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
13 *
d14d33bf
AM
14 * You should have received a copy of the GNU General Public License along
15 * with this program; if not, write to the Free Software Foundation, Inc.,
16 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
3bd1e081
MD
17 */
18
ace0e591 19#include "common/buffer-view.h"
1fdb9a78 20#include <stdint.h>
6c1c0768 21#define _LGPL_SOURCE
3bd1e081 22#include <assert.h>
3bd1e081
MD
23#include <poll.h>
24#include <pthread.h>
25#include <stdlib.h>
26#include <string.h>
27#include <sys/mman.h>
28#include <sys/socket.h>
29#include <sys/types.h>
77c7c900 30#include <inttypes.h>
3bd1e081 31#include <unistd.h>
dbb5dfe6 32#include <sys/stat.h>
3bd1e081 33
51a9e1c7 34#include <bin/lttng-consumerd/health-consumerd.h>
990570ed 35#include <common/common.h>
10a8a223 36#include <common/kernel-ctl/kernel-ctl.h>
10a8a223 37#include <common/sessiond-comm/sessiond-comm.h>
00e2e675 38#include <common/sessiond-comm/relayd.h>
dbb5dfe6 39#include <common/compat/fcntl.h>
f263b7fd 40#include <common/compat/endian.h>
acdb9057 41#include <common/pipe.h>
00e2e675 42#include <common/relayd/relayd.h>
fe4477ee 43#include <common/utils.h>
c8fea79c 44#include <common/consumer/consumer-stream.h>
309167d2 45#include <common/index/index.h>
c8fea79c 46#include <common/consumer/consumer-timer.h>
0857097f 47
10a8a223 48#include "kernel-consumer.h"
3bd1e081
MD
49
50extern struct lttng_consumer_global_data consumer_data;
51extern int consumer_poll_timeout;
52extern volatile int consumer_quit;
53
3bd1e081
MD
54/*
55 * Take a snapshot for a specific fd
56 *
57 * Returns 0 on success, < 0 on error
58 */
ffe60014 59int lttng_kconsumer_take_snapshot(struct lttng_consumer_stream *stream)
3bd1e081
MD
60{
61 int ret = 0;
62 int infd = stream->wait_fd;
63
64 ret = kernctl_snapshot(infd);
ee6bb36a
JD
65 /*
66 * -EAGAIN is not an error, it just means that there is no data to
67 * be read.
68 */
69 if (ret != 0 && ret != -EAGAIN) {
5a510c9f 70 PERROR("Getting sub-buffer snapshot.");
3bd1e081
MD
71 }
72
73 return ret;
74}
75
76/*
77 * Get the produced position
78 *
79 * Returns 0 on success, < 0 on error
80 */
ffe60014 81int lttng_kconsumer_get_produced_snapshot(struct lttng_consumer_stream *stream,
3bd1e081
MD
82 unsigned long *pos)
83{
84 int ret;
85 int infd = stream->wait_fd;
86
87 ret = kernctl_snapshot_get_produced(infd, pos);
88 if (ret != 0) {
5a510c9f 89 PERROR("kernctl_snapshot_get_produced");
3bd1e081
MD
90 }
91
92 return ret;
93}
94
07b86b52
JD
95/*
96 * Get the consumerd position
97 *
98 * Returns 0 on success, < 0 on error
99 */
100int lttng_kconsumer_get_consumed_snapshot(struct lttng_consumer_stream *stream,
101 unsigned long *pos)
102{
103 int ret;
104 int infd = stream->wait_fd;
105
106 ret = kernctl_snapshot_get_consumed(infd, pos);
107 if (ret != 0) {
5a510c9f 108 PERROR("kernctl_snapshot_get_consumed");
07b86b52
JD
109 }
110
111 return ret;
112}
113
1fdb9a78
JG
114static
115int get_current_subbuf_addr(struct lttng_consumer_stream *stream,
116 const char **addr)
117{
118 int ret;
119 unsigned long mmap_offset;
120 const char *mmap_base = stream->mmap_base;
121
122 ret = kernctl_get_mmap_read_offset(stream->wait_fd, &mmap_offset);
123 if (ret < 0) {
124 PERROR("Failed to get mmap read offset");
125 goto error;
126 }
127
128 *addr = mmap_base + mmap_offset;
129error:
130 return ret;
131}
132
07b86b52
JD
133/*
134 * Take a snapshot of all the stream of a channel
135 *
136 * Returns 0 on success, < 0 on error
137 */
138int lttng_kconsumer_snapshot_channel(uint64_t key, char *path,
d07ceecd 139 uint64_t relayd_id, uint64_t nb_packets_per_stream,
5c786ded 140 struct lttng_consumer_local_data *ctx)
07b86b52
JD
141{
142 int ret;
07b86b52
JD
143 struct lttng_consumer_channel *channel;
144 struct lttng_consumer_stream *stream;
145
6a00837f 146 DBG("Kernel consumer snapshot channel %" PRIu64, key);
07b86b52
JD
147
148 rcu_read_lock();
149
150 channel = consumer_find_channel(key);
151 if (!channel) {
6a00837f 152 ERR("No channel found for key %" PRIu64, key);
07b86b52
JD
153 ret = -1;
154 goto end;
155 }
156
157 /* Splice is not supported yet for channel snapshot. */
158 if (channel->output != CONSUMER_CHANNEL_MMAP) {
159 ERR("Unsupported output %d", channel->output);
160 ret = -1;
161 goto end;
162 }
163
10a50311 164 cds_list_for_each_entry(stream, &channel->streams.head, send_node) {
923333cd 165 unsigned long consumed_pos, produced_pos;
9ce5646a
MD
166
167 health_code_update();
168
07b86b52
JD
169 /*
170 * Lock stream because we are about to change its state.
171 */
172 pthread_mutex_lock(&stream->lock);
173
29decac3
DG
174 /*
175 * Assign the received relayd ID so we can use it for streaming. The streams
176 * are not visible to anyone so this is OK to change it.
177 */
6d40f8fa 178 stream->relayd_id = relayd_id;
07b86b52
JD
179 channel->relayd_id = relayd_id;
180 if (relayd_id != (uint64_t) -1ULL) {
10a50311 181 ret = consumer_send_relayd_stream(stream, path);
07b86b52
JD
182 if (ret < 0) {
183 ERR("sending stream to relayd");
184 goto end_unlock;
185 }
07b86b52
JD
186 } else {
187 ret = utils_create_stream_file(path, stream->name,
10a50311
JD
188 stream->chan->tracefile_size,
189 stream->tracefile_count_current,
309167d2 190 stream->uid, stream->gid, NULL);
07b86b52
JD
191 if (ret < 0) {
192 ERR("utils_create_stream_file");
193 goto end_unlock;
194 }
195
196 stream->out_fd = ret;
197 stream->tracefile_size_current = 0;
198
81ea21bf
MD
199 DBG("Kernel consumer snapshot stream %s/%s (%" PRIu64 ")",
200 path, stream->name, stream->key);
07b86b52 201 }
601262d6
JD
202 if (relayd_id != -1ULL) {
203 ret = consumer_send_relayd_streams_sent(relayd_id);
204 if (ret < 0) {
205 ERR("sending streams sent to relayd");
206 goto end_unlock;
207 }
b7fa98e6 208 channel->streams_sent_to_relayd = true;
a4baae1b 209 }
07b86b52 210
612b8ed8 211 ret = kernctl_buffer_flush_empty(stream->wait_fd);
07b86b52 212 if (ret < 0) {
612b8ed8
MD
213 /*
214 * Doing a buffer flush which does not take into
215 * account empty packets. This is not perfect
216 * for stream intersection, but required as a
217 * fall-back when "flush_empty" is not
218 * implemented by lttng-modules.
219 */
220 ret = kernctl_buffer_flush(stream->wait_fd);
221 if (ret < 0) {
222 ERR("Failed to flush kernel stream");
223 goto end_unlock;
224 }
07b86b52
JD
225 goto end_unlock;
226 }
227
228 ret = lttng_kconsumer_take_snapshot(stream);
229 if (ret < 0) {
230 ERR("Taking kernel snapshot");
231 goto end_unlock;
232 }
233
234 ret = lttng_kconsumer_get_produced_snapshot(stream, &produced_pos);
235 if (ret < 0) {
236 ERR("Produced kernel snapshot position");
237 goto end_unlock;
238 }
239
240 ret = lttng_kconsumer_get_consumed_snapshot(stream, &consumed_pos);
241 if (ret < 0) {
242 ERR("Consumerd kernel snapshot position");
243 goto end_unlock;
244 }
245
246 if (stream->max_sb_size == 0) {
247 ret = kernctl_get_max_subbuf_size(stream->wait_fd,
248 &stream->max_sb_size);
249 if (ret < 0) {
250 ERR("Getting kernel max_sb_size");
251 goto end_unlock;
252 }
253 }
254
d07ceecd
MD
255 consumed_pos = consumer_get_consume_start_pos(consumed_pos,
256 produced_pos, nb_packets_per_stream,
257 stream->max_sb_size);
5c786ded 258
07b86b52
JD
259 while (consumed_pos < produced_pos) {
260 ssize_t read_len;
261 unsigned long len, padded_len;
1fdb9a78 262 const char *subbuf_addr;
ace0e591 263 struct lttng_buffer_view subbuf_view;
07b86b52 264
9ce5646a 265 health_code_update();
07b86b52
JD
266 DBG("Kernel consumer taking snapshot at pos %lu", consumed_pos);
267
268 ret = kernctl_get_subbuf(stream->wait_fd, &consumed_pos);
269 if (ret < 0) {
32af2c95 270 if (ret != -EAGAIN) {
07b86b52
JD
271 PERROR("kernctl_get_subbuf snapshot");
272 goto end_unlock;
273 }
274 DBG("Kernel consumer get subbuf failed. Skipping it.");
275 consumed_pos += stream->max_sb_size;
6e1f2e92 276 stream->chan->lost_packets++;
07b86b52
JD
277 continue;
278 }
279
280 ret = kernctl_get_subbuf_size(stream->wait_fd, &len);
281 if (ret < 0) {
282 ERR("Snapshot kernctl_get_subbuf_size");
29decac3 283 goto error_put_subbuf;
07b86b52
JD
284 }
285
286 ret = kernctl_get_padded_subbuf_size(stream->wait_fd, &padded_len);
287 if (ret < 0) {
288 ERR("Snapshot kernctl_get_padded_subbuf_size");
29decac3 289 goto error_put_subbuf;
07b86b52
JD
290 }
291
1fdb9a78
JG
292 ret = get_current_subbuf_addr(stream, &subbuf_addr);
293 if (ret) {
294 goto error_put_subbuf;
295 }
296
ace0e591
JG
297 subbuf_view = lttng_buffer_view_init(
298 subbuf_addr, 0, padded_len);
1fdb9a78 299 read_len = lttng_consumer_on_read_subbuffer_mmap(ctx,
ace0e591 300 stream, &subbuf_view,
309167d2 301 padded_len - len, NULL);
07b86b52 302 /*
29decac3
DG
303 * We write the padded len in local tracefiles but the data len
304 * when using a relay. Display the error but continue processing
305 * to try to release the subbuffer.
07b86b52
JD
306 */
307 if (relayd_id != (uint64_t) -1ULL) {
308 if (read_len != len) {
309 ERR("Error sending to the relay (ret: %zd != len: %lu)",
310 read_len, len);
311 }
312 } else {
313 if (read_len != padded_len) {
314 ERR("Error writing to tracefile (ret: %zd != len: %lu)",
315 read_len, padded_len);
316 }
317 }
318
319 ret = kernctl_put_subbuf(stream->wait_fd);
320 if (ret < 0) {
321 ERR("Snapshot kernctl_put_subbuf");
322 goto end_unlock;
323 }
324 consumed_pos += stream->max_sb_size;
325 }
326
327 if (relayd_id == (uint64_t) -1ULL) {
fdf9986c
MD
328 if (stream->out_fd >= 0) {
329 ret = close(stream->out_fd);
330 if (ret < 0) {
331 PERROR("Kernel consumer snapshot close out_fd");
332 goto end_unlock;
333 }
334 stream->out_fd = -1;
07b86b52 335 }
07b86b52
JD
336 } else {
337 close_relayd_stream(stream);
6d40f8fa 338 stream->relayd_id = (uint64_t) -1ULL;
07b86b52
JD
339 }
340 pthread_mutex_unlock(&stream->lock);
341 }
342
343 /* All good! */
344 ret = 0;
345 goto end;
346
29decac3
DG
347error_put_subbuf:
348 ret = kernctl_put_subbuf(stream->wait_fd);
349 if (ret < 0) {
350 ERR("Snapshot kernctl_put_subbuf error path");
351 }
07b86b52
JD
352end_unlock:
353 pthread_mutex_unlock(&stream->lock);
354end:
355 rcu_read_unlock();
356 return ret;
357}
358
359/*
360 * Read the whole metadata available for a snapshot.
361 *
362 * Returns 0 on success, < 0 on error
363 */
a34de389 364static int lttng_kconsumer_snapshot_metadata(uint64_t key, char *path,
e2039c7a 365 uint64_t relayd_id, struct lttng_consumer_local_data *ctx)
07b86b52 366{
d771f832
DG
367 int ret, use_relayd = 0;
368 ssize_t ret_read;
07b86b52
JD
369 struct lttng_consumer_channel *metadata_channel;
370 struct lttng_consumer_stream *metadata_stream;
d771f832
DG
371
372 assert(ctx);
07b86b52
JD
373
374 DBG("Kernel consumer snapshot metadata with key %" PRIu64 " at path %s",
375 key, path);
376
377 rcu_read_lock();
378
379 metadata_channel = consumer_find_channel(key);
380 if (!metadata_channel) {
d771f832 381 ERR("Kernel snapshot metadata not found for key %" PRIu64, key);
07b86b52 382 ret = -1;
a34de389 383 goto error_no_channel;
07b86b52
JD
384 }
385
386 metadata_stream = metadata_channel->metadata_stream;
387 assert(metadata_stream);
a34de389 388 pthread_mutex_lock(&metadata_stream->lock);
07b86b52 389
d771f832 390 /* Flag once that we have a valid relayd for the stream. */
e2039c7a 391 if (relayd_id != (uint64_t) -1ULL) {
d771f832
DG
392 use_relayd = 1;
393 }
394
395 if (use_relayd) {
10a50311 396 ret = consumer_send_relayd_stream(metadata_stream, path);
e2039c7a 397 if (ret < 0) {
a34de389 398 goto error_snapshot;
e2039c7a 399 }
e2039c7a
JD
400 } else {
401 ret = utils_create_stream_file(path, metadata_stream->name,
402 metadata_stream->chan->tracefile_size,
403 metadata_stream->tracefile_count_current,
309167d2 404 metadata_stream->uid, metadata_stream->gid, NULL);
e2039c7a 405 if (ret < 0) {
a34de389 406 goto error_snapshot;
e2039c7a
JD
407 }
408 metadata_stream->out_fd = ret;
07b86b52 409 }
07b86b52 410
d771f832 411 do {
9ce5646a
MD
412 health_code_update();
413
d771f832
DG
414 ret_read = lttng_kconsumer_read_subbuffer(metadata_stream, ctx);
415 if (ret_read < 0) {
56591bac 416 if (ret_read != -EAGAIN) {
6a00837f 417 ERR("Kernel snapshot reading metadata subbuffer (ret: %zd)",
d771f832 418 ret_read);
a34de389
JG
419 ret = ret_read;
420 goto error_snapshot;
07b86b52 421 }
d771f832 422 /* ret_read is negative at this point so we will exit the loop. */
07b86b52
JD
423 continue;
424 }
d771f832 425 } while (ret_read >= 0);
07b86b52 426
d771f832
DG
427 if (use_relayd) {
428 close_relayd_stream(metadata_stream);
6d40f8fa 429 metadata_stream->relayd_id = (uint64_t) -1ULL;
d771f832 430 } else {
fdf9986c
MD
431 if (metadata_stream->out_fd >= 0) {
432 ret = close(metadata_stream->out_fd);
433 if (ret < 0) {
434 PERROR("Kernel consumer snapshot metadata close out_fd");
435 /*
436 * Don't go on error here since the snapshot was successful at this
437 * point but somehow the close failed.
438 */
439 }
440 metadata_stream->out_fd = -1;
e2039c7a 441 }
e2039c7a
JD
442 }
443
07b86b52 444 ret = 0;
a34de389
JG
445error_snapshot:
446 pthread_mutex_unlock(&metadata_stream->lock);
cf53a8a6
JD
447 cds_list_del(&metadata_stream->send_node);
448 consumer_stream_destroy(metadata_stream, NULL);
449 metadata_channel->metadata_stream = NULL;
a34de389 450error_no_channel:
07b86b52
JD
451 rcu_read_unlock();
452 return ret;
453}
454
1803a064
MD
455/*
456 * Receive command from session daemon and process it.
457 *
458 * Return 1 on success else a negative value or 0.
459 */
3bd1e081
MD
460int lttng_kconsumer_recv_cmd(struct lttng_consumer_local_data *ctx,
461 int sock, struct pollfd *consumer_sockpoll)
462{
463 ssize_t ret;
0c759fc9 464 enum lttcomm_return_code ret_code = LTTCOMM_CONSUMERD_SUCCESS;
3bd1e081
MD
465 struct lttcomm_consumer_msg msg;
466
9ce5646a
MD
467 health_code_update();
468
3bd1e081
MD
469 ret = lttcomm_recv_unix_sock(sock, &msg, sizeof(msg));
470 if (ret != sizeof(msg)) {
1803a064 471 if (ret > 0) {
c6857fcf 472 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_ERROR_RECV_CMD);
1803a064
MD
473 ret = -1;
474 }
3bd1e081
MD
475 return ret;
476 }
9ce5646a
MD
477
478 health_code_update();
479
84382d49
MD
480 /* Deprecated command */
481 assert(msg.cmd_type != LTTNG_CONSUMER_STOP);
3bd1e081 482
9ce5646a
MD
483 health_code_update();
484
b0b335c8
MD
485 /* relayd needs RCU read-side protection */
486 rcu_read_lock();
487
3bd1e081 488 switch (msg.cmd_type) {
00e2e675
DG
489 case LTTNG_CONSUMER_ADD_RELAYD_SOCKET:
490 {
f50f23d9 491 /* Session daemon status message are handled in the following call. */
028ba707 492 consumer_add_relayd_socket(msg.u.relayd_sock.net_index,
7735ef9e 493 msg.u.relayd_sock.type, ctx, sock, consumer_sockpoll,
d3e2ba59 494 &msg.u.relayd_sock.sock, msg.u.relayd_sock.session_id,
028ba707 495 msg.u.relayd_sock.relayd_session_id);
00e2e675
DG
496 goto end_nosignal;
497 }
3bd1e081
MD
498 case LTTNG_CONSUMER_ADD_CHANNEL:
499 {
500 struct lttng_consumer_channel *new_channel;
e43c41c5 501 int ret_recv;
3bd1e081 502
9ce5646a
MD
503 health_code_update();
504
f50f23d9
DG
505 /* First send a status message before receiving the fds. */
506 ret = consumer_send_status_msg(sock, ret_code);
507 if (ret < 0) {
508 /* Somehow, the session daemon is not responding anymore. */
1803a064 509 goto error_fatal;
f50f23d9 510 }
9ce5646a
MD
511
512 health_code_update();
513
d88aee68 514 DBG("consumer_add_channel %" PRIu64, msg.u.channel.channel_key);
3bd1e081 515 new_channel = consumer_allocate_channel(msg.u.channel.channel_key,
ffe60014
DG
516 msg.u.channel.session_id, msg.u.channel.pathname,
517 msg.u.channel.name, msg.u.channel.uid, msg.u.channel.gid,
1624d5b7
JD
518 msg.u.channel.relayd_id, msg.u.channel.output,
519 msg.u.channel.tracefile_size,
1950109e 520 msg.u.channel.tracefile_count, 0,
ecc48a90 521 msg.u.channel.monitor,
d7ba1388 522 msg.u.channel.live_timer_interval,
11785f65 523 msg.u.channel.is_live,
3d071855 524 NULL, NULL);
3bd1e081 525 if (new_channel == NULL) {
f73fabfd 526 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_OUTFD_ERROR);
3bd1e081
MD
527 goto end_nosignal;
528 }
ffe60014 529 new_channel->nb_init_stream_left = msg.u.channel.nb_init_streams;
95a1109b
JD
530 switch (msg.u.channel.output) {
531 case LTTNG_EVENT_SPLICE:
532 new_channel->output = CONSUMER_CHANNEL_SPLICE;
533 break;
534 case LTTNG_EVENT_MMAP:
535 new_channel->output = CONSUMER_CHANNEL_MMAP;
536 break;
537 default:
538 ERR("Channel output unknown %d", msg.u.channel.output);
539 goto end_nosignal;
540 }
ffe60014
DG
541
542 /* Translate and save channel type. */
543 switch (msg.u.channel.type) {
544 case CONSUMER_CHANNEL_TYPE_DATA:
545 case CONSUMER_CHANNEL_TYPE_METADATA:
546 new_channel->type = msg.u.channel.type;
547 break;
548 default:
549 assert(0);
550 goto end_nosignal;
551 };
552
9ce5646a
MD
553 health_code_update();
554
3bd1e081 555 if (ctx->on_recv_channel != NULL) {
e43c41c5
JD
556 ret_recv = ctx->on_recv_channel(new_channel);
557 if (ret_recv == 0) {
558 ret = consumer_add_channel(new_channel, ctx);
559 } else if (ret_recv < 0) {
3bd1e081
MD
560 goto end_nosignal;
561 }
562 } else {
e43c41c5 563 ret = consumer_add_channel(new_channel, ctx);
3bd1e081 564 }
94d49140
JD
565 if (CONSUMER_CHANNEL_TYPE_DATA) {
566 consumer_timer_live_start(new_channel,
567 msg.u.channel.live_timer_interval);
568 }
e43c41c5 569
9ce5646a
MD
570 health_code_update();
571
e43c41c5 572 /* If we received an error in add_channel, we need to report it. */
821fffb2 573 if (ret < 0) {
1803a064
MD
574 ret = consumer_send_status_msg(sock, ret);
575 if (ret < 0) {
576 goto error_fatal;
577 }
e43c41c5
JD
578 goto end_nosignal;
579 }
580
3bd1e081
MD
581 goto end_nosignal;
582 }
583 case LTTNG_CONSUMER_ADD_STREAM:
584 {
dae10966
DG
585 int fd;
586 struct lttng_pipe *stream_pipe;
00e2e675 587 struct lttng_consumer_stream *new_stream;
ffe60014 588 struct lttng_consumer_channel *channel;
c80048c6 589 int alloc_ret = 0;
3bd1e081 590
ffe60014
DG
591 /*
592 * Get stream's channel reference. Needed when adding the stream to the
593 * global hash table.
594 */
595 channel = consumer_find_channel(msg.u.stream.channel_key);
596 if (!channel) {
597 /*
598 * We could not find the channel. Can happen if cpu hotplug
599 * happens while tearing down.
600 */
d88aee68 601 ERR("Unable to find channel key %" PRIu64, msg.u.stream.channel_key);
e462382a 602 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
ffe60014
DG
603 }
604
9ce5646a
MD
605 health_code_update();
606
f50f23d9
DG
607 /* First send a status message before receiving the fds. */
608 ret = consumer_send_status_msg(sock, ret_code);
1803a064 609 if (ret < 0) {
d771f832 610 /* Somehow, the session daemon is not responding anymore. */
1803a064
MD
611 goto error_fatal;
612 }
9ce5646a
MD
613
614 health_code_update();
615
0c759fc9 616 if (ret_code != LTTCOMM_CONSUMERD_SUCCESS) {
d771f832 617 /* Channel was not found. */
f50f23d9
DG
618 goto end_nosignal;
619 }
620
d771f832 621 /* Blocking call */
9ce5646a
MD
622 health_poll_entry();
623 ret = lttng_consumer_poll_socket(consumer_sockpoll);
624 health_poll_exit();
84382d49
MD
625 if (ret) {
626 goto error_fatal;
3bd1e081 627 }
00e2e675 628
9ce5646a
MD
629 health_code_update();
630
00e2e675 631 /* Get stream file descriptor from socket */
f2fc6720
MD
632 ret = lttcomm_recv_fds_unix_sock(sock, &fd, 1);
633 if (ret != sizeof(fd)) {
f73fabfd 634 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_ERROR_RECV_FD);
3f8e211f 635 rcu_read_unlock();
3bd1e081
MD
636 return ret;
637 }
3bd1e081 638
9ce5646a
MD
639 health_code_update();
640
f50f23d9
DG
641 /*
642 * Send status code to session daemon only if the recv works. If the
643 * above recv() failed, the session daemon is notified through the
644 * error socket and the teardown is eventually done.
645 */
646 ret = consumer_send_status_msg(sock, ret_code);
647 if (ret < 0) {
648 /* Somehow, the session daemon is not responding anymore. */
649 goto end_nosignal;
650 }
651
9ce5646a
MD
652 health_code_update();
653
59db0d42
JG
654 pthread_mutex_lock(&channel->lock);
655 new_stream = consumer_allocate_stream(
656 channel,
657 channel->key,
ffe60014
DG
658 fd,
659 LTTNG_CONSUMER_ACTIVE_STREAM,
660 channel->name,
661 channel->uid,
662 channel->gid,
663 channel->relayd_id,
664 channel->session_id,
665 msg.u.stream.cpu,
666 &alloc_ret,
4891ece8
DG
667 channel->type,
668 channel->monitor);
3bd1e081 669 if (new_stream == NULL) {
c80048c6
MD
670 switch (alloc_ret) {
671 case -ENOMEM:
672 case -EINVAL:
673 default:
674 lttng_consumer_send_error(ctx, LTTCOMM_CONSUMERD_OUTFD_ERROR);
675 break;
c80048c6 676 }
59db0d42 677 pthread_mutex_unlock(&channel->lock);
3f8e211f 678 goto end_nosignal;
3bd1e081 679 }
d771f832 680
ffe60014 681 new_stream->wait_fd = fd;
07b86b52
JD
682 switch (channel->output) {
683 case CONSUMER_CHANNEL_SPLICE:
684 new_stream->output = LTTNG_EVENT_SPLICE;
a2361a61
JD
685 ret = utils_create_pipe(new_stream->splice_pipe);
686 if (ret < 0) {
687 goto end_nosignal;
688 }
07b86b52
JD
689 break;
690 case CONSUMER_CHANNEL_MMAP:
691 new_stream->output = LTTNG_EVENT_MMAP;
692 break;
693 default:
694 ERR("Stream output unknown %d", channel->output);
695 goto end_nosignal;
696 }
00e2e675 697
a0c83db9
DG
698 /*
699 * We've just assigned the channel to the stream so increment the
07b86b52
JD
700 * refcount right now. We don't need to increment the refcount for
701 * streams in no monitor because we handle manually the cleanup of
702 * those. It is very important to make sure there is NO prior
703 * consumer_del_stream() calls or else the refcount will be unbalanced.
a0c83db9 704 */
07b86b52
JD
705 if (channel->monitor) {
706 uatomic_inc(&new_stream->chan->refcount);
707 }
9d9353f9 708
fb3a43a9
DG
709 /*
710 * The buffer flush is done on the session daemon side for the kernel
711 * so no need for the stream "hangup_flush_done" variable to be
712 * tracked. This is important for a kernel stream since we don't rely
713 * on the flush state of the stream to read data. It's not the case for
714 * user space tracing.
715 */
716 new_stream->hangup_flush_done = 0;
717
9ce5646a
MD
718 health_code_update();
719
633d0084
DG
720 if (ctx->on_recv_stream) {
721 ret = ctx->on_recv_stream(new_stream);
722 if (ret < 0) {
d771f832 723 consumer_stream_free(new_stream);
633d0084 724 goto end_nosignal;
fb3a43a9 725 }
633d0084 726 }
fb3a43a9 727
9ce5646a
MD
728 health_code_update();
729
07b86b52
JD
730 if (new_stream->metadata_flag) {
731 channel->metadata_stream = new_stream;
732 }
733
2bba9e53
DG
734 /* Do not monitor this stream. */
735 if (!channel->monitor) {
5eecee74 736 DBG("Kernel consumer add stream %s in no monitor mode with "
6dc3064a 737 "relayd id %" PRIu64, new_stream->name,
6d40f8fa 738 new_stream->relayd_id);
10a50311 739 cds_list_add(&new_stream->send_node, &channel->streams.head);
59db0d42 740 pthread_mutex_unlock(&channel->lock);
6dc3064a
DG
741 break;
742 }
743
e1b71bdc 744 /* Send stream to relayd if the stream has an ID. */
6d40f8fa 745 if (new_stream->relayd_id != (uint64_t) -1ULL) {
194ee077
DG
746 ret = consumer_send_relayd_stream(new_stream,
747 new_stream->chan->pathname);
e1b71bdc 748 if (ret < 0) {
59db0d42 749 pthread_mutex_unlock(&channel->lock);
e1b71bdc
DG
750 consumer_stream_free(new_stream);
751 goto end_nosignal;
752 }
b7fa98e6
MD
753
754 /*
755 * If adding an extra stream to an already
756 * existing channel (e.g. cpu hotplug), we need
757 * to send the "streams_sent" command to relayd.
758 */
759 if (channel->streams_sent_to_relayd) {
760 ret = consumer_send_relayd_streams_sent(
6d40f8fa 761 new_stream->relayd_id);
b7fa98e6 762 if (ret < 0) {
59db0d42 763 pthread_mutex_unlock(&channel->lock);
b7fa98e6
MD
764 goto end_nosignal;
765 }
766 }
e2039c7a 767 }
59db0d42 768 pthread_mutex_unlock(&channel->lock);
e2039c7a 769
50f8ae69 770 /* Get the right pipe where the stream will be sent. */
633d0084 771 if (new_stream->metadata_flag) {
5ab66908
MD
772 ret = consumer_add_metadata_stream(new_stream);
773 if (ret) {
774 ERR("Consumer add metadata stream %" PRIu64 " failed. Continuing",
775 new_stream->key);
776 consumer_stream_free(new_stream);
777 goto end_nosignal;
778 }
dae10966 779 stream_pipe = ctx->consumer_metadata_pipe;
3bd1e081 780 } else {
5ab66908
MD
781 ret = consumer_add_data_stream(new_stream);
782 if (ret) {
783 ERR("Consumer add stream %" PRIu64 " failed. Continuing",
784 new_stream->key);
785 consumer_stream_free(new_stream);
786 goto end_nosignal;
787 }
dae10966 788 stream_pipe = ctx->consumer_data_pipe;
50f8ae69
DG
789 }
790
5ab66908
MD
791 /* Vitible to other threads */
792 new_stream->globally_visible = 1;
793
9ce5646a
MD
794 health_code_update();
795
dae10966 796 ret = lttng_pipe_write(stream_pipe, &new_stream, sizeof(new_stream));
50f8ae69 797 if (ret < 0) {
dae10966 798 ERR("Consumer write %s stream to pipe %d",
50f8ae69 799 new_stream->metadata_flag ? "metadata" : "data",
dae10966 800 lttng_pipe_get_writefd(stream_pipe));
5ab66908
MD
801 if (new_stream->metadata_flag) {
802 consumer_del_stream_for_metadata(new_stream);
803 } else {
804 consumer_del_stream_for_data(new_stream);
805 }
50f8ae69 806 goto end_nosignal;
3bd1e081 807 }
00e2e675 808
50f8ae69 809 DBG("Kernel consumer ADD_STREAM %s (fd: %d) with relayd id %" PRIu64,
ffe60014 810 new_stream->name, fd, new_stream->relayd_stream_id);
3bd1e081
MD
811 break;
812 }
a4baae1b
JD
813 case LTTNG_CONSUMER_STREAMS_SENT:
814 {
815 struct lttng_consumer_channel *channel;
816
817 /*
818 * Get stream's channel reference. Needed when adding the stream to the
819 * global hash table.
820 */
821 channel = consumer_find_channel(msg.u.sent_streams.channel_key);
822 if (!channel) {
823 /*
824 * We could not find the channel. Can happen if cpu hotplug
825 * happens while tearing down.
826 */
827 ERR("Unable to find channel key %" PRIu64,
828 msg.u.sent_streams.channel_key);
e462382a 829 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
a4baae1b
JD
830 }
831
832 health_code_update();
833
834 /*
835 * Send status code to session daemon.
836 */
837 ret = consumer_send_status_msg(sock, ret_code);
f261ad0a 838 if (ret < 0 || ret_code != LTTCOMM_CONSUMERD_SUCCESS) {
a4baae1b
JD
839 /* Somehow, the session daemon is not responding anymore. */
840 goto end_nosignal;
841 }
842
843 health_code_update();
844
845 /*
846 * We should not send this message if we don't monitor the
847 * streams in this channel.
848 */
849 if (!channel->monitor) {
850 break;
851 }
852
853 health_code_update();
854 /* Send stream to relayd if the stream has an ID. */
855 if (msg.u.sent_streams.net_seq_idx != (uint64_t) -1ULL) {
856 ret = consumer_send_relayd_streams_sent(
857 msg.u.sent_streams.net_seq_idx);
858 if (ret < 0) {
859 goto end_nosignal;
860 }
b7fa98e6 861 channel->streams_sent_to_relayd = true;
a4baae1b
JD
862 }
863 break;
864 }
3bd1e081
MD
865 case LTTNG_CONSUMER_UPDATE_STREAM:
866 {
3f8e211f
DG
867 rcu_read_unlock();
868 return -ENOSYS;
869 }
870 case LTTNG_CONSUMER_DESTROY_RELAYD:
871 {
a6ba4fe1 872 uint64_t index = msg.u.destroy_relayd.net_seq_idx;
3f8e211f
DG
873 struct consumer_relayd_sock_pair *relayd;
874
a6ba4fe1 875 DBG("Kernel consumer destroying relayd %" PRIu64, index);
3f8e211f
DG
876
877 /* Get relayd reference if exists. */
a6ba4fe1 878 relayd = consumer_find_relayd(index);
3f8e211f 879 if (relayd == NULL) {
3448e266 880 DBG("Unable to find relayd %" PRIu64, index);
e462382a 881 ret_code = LTTCOMM_CONSUMERD_RELAYD_FAIL;
3bd1e081 882 }
3f8e211f 883
a6ba4fe1
DG
884 /*
885 * Each relayd socket pair has a refcount of stream attached to it
886 * which tells if the relayd is still active or not depending on the
887 * refcount value.
888 *
889 * This will set the destroy flag of the relayd object and destroy it
890 * if the refcount reaches zero when called.
891 *
892 * The destroy can happen either here or when a stream fd hangs up.
893 */
f50f23d9
DG
894 if (relayd) {
895 consumer_flag_relayd_for_destroy(relayd);
896 }
897
9ce5646a
MD
898 health_code_update();
899
f50f23d9
DG
900 ret = consumer_send_status_msg(sock, ret_code);
901 if (ret < 0) {
902 /* Somehow, the session daemon is not responding anymore. */
1803a064 903 goto error_fatal;
f50f23d9 904 }
3f8e211f 905
3f8e211f 906 goto end_nosignal;
3bd1e081 907 }
6d805429 908 case LTTNG_CONSUMER_DATA_PENDING:
53632229 909 {
c8f59ee5 910 int32_t ret;
6d805429 911 uint64_t id = msg.u.data_pending.session_id;
c8f59ee5 912
6d805429 913 DBG("Kernel consumer data pending command for id %" PRIu64, id);
c8f59ee5 914
6d805429 915 ret = consumer_data_pending(id);
c8f59ee5 916
9ce5646a
MD
917 health_code_update();
918
c8f59ee5
DG
919 /* Send back returned value to session daemon */
920 ret = lttcomm_send_unix_sock(sock, &ret, sizeof(ret));
921 if (ret < 0) {
6d805429 922 PERROR("send data pending ret code");
1803a064 923 goto error_fatal;
c8f59ee5 924 }
f50f23d9
DG
925
926 /*
927 * No need to send back a status message since the data pending
928 * returned value is the response.
929 */
c8f59ee5 930 break;
53632229 931 }
6dc3064a
DG
932 case LTTNG_CONSUMER_SNAPSHOT_CHANNEL:
933 {
07b86b52
JD
934 if (msg.u.snapshot_channel.metadata == 1) {
935 ret = lttng_kconsumer_snapshot_metadata(msg.u.snapshot_channel.key,
e2039c7a
JD
936 msg.u.snapshot_channel.pathname,
937 msg.u.snapshot_channel.relayd_id, ctx);
07b86b52
JD
938 if (ret < 0) {
939 ERR("Snapshot metadata failed");
e462382a 940 ret_code = LTTCOMM_CONSUMERD_ERROR_METADATA;
07b86b52
JD
941 }
942 } else {
943 ret = lttng_kconsumer_snapshot_channel(msg.u.snapshot_channel.key,
944 msg.u.snapshot_channel.pathname,
5c786ded 945 msg.u.snapshot_channel.relayd_id,
d07ceecd 946 msg.u.snapshot_channel.nb_packets_per_stream,
5c786ded 947 ctx);
07b86b52
JD
948 if (ret < 0) {
949 ERR("Snapshot channel failed");
e462382a 950 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
07b86b52
JD
951 }
952 }
953
9ce5646a
MD
954 health_code_update();
955
6dc3064a
DG
956 ret = consumer_send_status_msg(sock, ret_code);
957 if (ret < 0) {
958 /* Somehow, the session daemon is not responding anymore. */
959 goto end_nosignal;
960 }
961 break;
962 }
07b86b52
JD
963 case LTTNG_CONSUMER_DESTROY_CHANNEL:
964 {
965 uint64_t key = msg.u.destroy_channel.key;
966 struct lttng_consumer_channel *channel;
967
968 channel = consumer_find_channel(key);
969 if (!channel) {
970 ERR("Kernel consumer destroy channel %" PRIu64 " not found", key);
e462382a 971 ret_code = LTTCOMM_CONSUMERD_CHAN_NOT_FOUND;
07b86b52
JD
972 }
973
9ce5646a
MD
974 health_code_update();
975
07b86b52
JD
976 ret = consumer_send_status_msg(sock, ret_code);
977 if (ret < 0) {
978 /* Somehow, the session daemon is not responding anymore. */
979 goto end_nosignal;
980 }
981
9ce5646a
MD
982 health_code_update();
983
15dc512a
DG
984 /* Stop right now if no channel was found. */
985 if (!channel) {
986 goto end_nosignal;
987 }
988
07b86b52
JD
989 /*
990 * This command should ONLY be issued for channel with streams set in
991 * no monitor mode.
992 */
993 assert(!channel->monitor);
994
995 /*
996 * The refcount should ALWAYS be 0 in the case of a channel in no
997 * monitor mode.
998 */
999 assert(!uatomic_sub_return(&channel->refcount, 1));
1000
1001 consumer_del_channel(channel);
1002
1003 goto end_nosignal;
1004 }
fb83fe64
JD
1005 case LTTNG_CONSUMER_DISCARDED_EVENTS:
1006 {
1007 uint64_t ret;
1008 struct lttng_consumer_channel *channel;
1009 uint64_t id = msg.u.discarded_events.session_id;
1010 uint64_t key = msg.u.discarded_events.channel_key;
1011
e5742757
MD
1012 DBG("Kernel consumer discarded events command for session id %"
1013 PRIu64 ", channel key %" PRIu64, id, key);
1014
fb83fe64
JD
1015 channel = consumer_find_channel(key);
1016 if (!channel) {
1017 ERR("Kernel consumer discarded events channel %"
1018 PRIu64 " not found", key);
e5742757
MD
1019 ret = 0;
1020 } else {
1021 ret = channel->discarded_events;
fb83fe64
JD
1022 }
1023
fb83fe64
JD
1024 health_code_update();
1025
1026 /* Send back returned value to session daemon */
1027 ret = lttcomm_send_unix_sock(sock, &ret, sizeof(ret));
1028 if (ret < 0) {
1029 PERROR("send discarded events");
1030 goto error_fatal;
1031 }
1032
1033 break;
1034 }
1035 case LTTNG_CONSUMER_LOST_PACKETS:
1036 {
1037 uint64_t ret;
1038 struct lttng_consumer_channel *channel;
1039 uint64_t id = msg.u.lost_packets.session_id;
1040 uint64_t key = msg.u.lost_packets.channel_key;
1041
e5742757
MD
1042 DBG("Kernel consumer lost packets command for session id %"
1043 PRIu64 ", channel key %" PRIu64, id, key);
1044
fb83fe64
JD
1045 channel = consumer_find_channel(key);
1046 if (!channel) {
1047 ERR("Kernel consumer lost packets channel %"
1048 PRIu64 " not found", key);
e5742757
MD
1049 ret = 0;
1050 } else {
1051 ret = channel->lost_packets;
fb83fe64
JD
1052 }
1053
fb83fe64
JD
1054 health_code_update();
1055
1056 /* Send back returned value to session daemon */
1057 ret = lttcomm_send_unix_sock(sock, &ret, sizeof(ret));
1058 if (ret < 0) {
1059 PERROR("send lost packets");
1060 goto error_fatal;
1061 }
1062
1063 break;
1064 }
3bd1e081 1065 default:
3f8e211f 1066 goto end_nosignal;
3bd1e081 1067 }
3f8e211f 1068
3bd1e081 1069end_nosignal:
b0b335c8 1070 rcu_read_unlock();
4cbc1a04
DG
1071
1072 /*
1073 * Return 1 to indicate success since the 0 value can be a socket
1074 * shutdown during the recv() or send() call.
1075 */
9ce5646a 1076 health_code_update();
4cbc1a04 1077 return 1;
1803a064
MD
1078
1079error_fatal:
1080 rcu_read_unlock();
1081 /* This will issue a consumer stop. */
1082 return -1;
3bd1e081 1083}
d41f73b7 1084
309167d2
JD
1085/*
1086 * Populate index values of a kernel stream. Values are set in big endian order.
1087 *
1088 * Return 0 on success or else a negative value.
1089 */
50adc264 1090static int get_index_values(struct ctf_packet_index *index, int infd)
309167d2
JD
1091{
1092 int ret;
1093
1094 ret = kernctl_get_timestamp_begin(infd, &index->timestamp_begin);
1095 if (ret < 0) {
1096 PERROR("kernctl_get_timestamp_begin");
1097 goto error;
1098 }
1099 index->timestamp_begin = htobe64(index->timestamp_begin);
1100
1101 ret = kernctl_get_timestamp_end(infd, &index->timestamp_end);
1102 if (ret < 0) {
1103 PERROR("kernctl_get_timestamp_end");
1104 goto error;
1105 }
1106 index->timestamp_end = htobe64(index->timestamp_end);
1107
1108 ret = kernctl_get_events_discarded(infd, &index->events_discarded);
1109 if (ret < 0) {
1110 PERROR("kernctl_get_events_discarded");
1111 goto error;
1112 }
1113 index->events_discarded = htobe64(index->events_discarded);
1114
1115 ret = kernctl_get_content_size(infd, &index->content_size);
1116 if (ret < 0) {
1117 PERROR("kernctl_get_content_size");
1118 goto error;
1119 }
1120 index->content_size = htobe64(index->content_size);
1121
1122 ret = kernctl_get_packet_size(infd, &index->packet_size);
1123 if (ret < 0) {
1124 PERROR("kernctl_get_packet_size");
1125 goto error;
1126 }
1127 index->packet_size = htobe64(index->packet_size);
1128
1129 ret = kernctl_get_stream_id(infd, &index->stream_id);
1130 if (ret < 0) {
1131 PERROR("kernctl_get_stream_id");
1132 goto error;
1133 }
1134 index->stream_id = htobe64(index->stream_id);
1135
234cd636
JD
1136 ret = kernctl_get_instance_id(infd, &index->stream_instance_id);
1137 if (ret < 0) {
f0b03c22
MD
1138 if (ret == -ENOTTY) {
1139 /* Command not implemented by lttng-modules. */
1140 index->stream_instance_id = -1ULL;
1141 ret = 0;
1142 } else {
1143 PERROR("kernctl_get_instance_id");
1144 goto error;
1145 }
234cd636
JD
1146 }
1147 index->stream_instance_id = htobe64(index->stream_instance_id);
1148
1149 ret = kernctl_get_sequence_number(infd, &index->packet_seq_num);
1150 if (ret < 0) {
f0b03c22
MD
1151 if (ret == -ENOTTY) {
1152 /* Command not implemented by lttng-modules. */
1153 index->packet_seq_num = -1ULL;
1154 ret = 0;
1155 } else {
1156 PERROR("kernctl_get_sequence_number");
1157 goto error;
1158 }
234cd636
JD
1159 }
1160 index->packet_seq_num = htobe64(index->packet_seq_num);
1161
309167d2
JD
1162error:
1163 return ret;
1164}
94d49140
JD
1165/*
1166 * Sync metadata meaning request them to the session daemon and snapshot to the
1167 * metadata thread can consumer them.
1168 *
1169 * Metadata stream lock MUST be acquired.
1170 *
1171 * Return 0 if new metadatda is available, EAGAIN if the metadata stream
1172 * is empty or a negative value on error.
1173 */
1174int lttng_kconsumer_sync_metadata(struct lttng_consumer_stream *metadata)
1175{
1176 int ret;
1177
1178 assert(metadata);
1179
1180 ret = kernctl_buffer_flush(metadata->wait_fd);
1181 if (ret < 0) {
1182 ERR("Failed to flush kernel stream");
1183 goto end;
1184 }
1185
1186 ret = kernctl_snapshot(metadata->wait_fd);
1187 if (ret < 0) {
32af2c95 1188 if (ret != -EAGAIN) {
94d49140
JD
1189 ERR("Sync metadata, taking kernel snapshot failed.");
1190 goto end;
1191 }
1192 DBG("Sync metadata, no new kernel metadata");
1193 /* No new metadata, exit. */
1194 ret = ENODATA;
1195 goto end;
1196 }
1197
1198end:
1199 return ret;
1200}
309167d2 1201
fb83fe64
JD
1202static
1203int update_stream_stats(struct lttng_consumer_stream *stream)
1204{
1205 int ret;
1206 uint64_t seq, discarded;
1207
1208 ret = kernctl_get_sequence_number(stream->wait_fd, &seq);
1209 if (ret < 0) {
f0b03c22
MD
1210 if (ret == -ENOTTY) {
1211 /* Command not implemented by lttng-modules. */
1212 seq = -1ULL;
1213 ret = 0;
1214 } else {
1215 PERROR("kernctl_get_sequence_number");
1216 goto end;
1217 }
fb83fe64
JD
1218 }
1219
1220 /*
1221 * Start the sequence when we extract the first packet in case we don't
1222 * start at 0 (for example if a consumer is not connected to the
1223 * session immediately after the beginning).
1224 */
1225 if (stream->last_sequence_number == -1ULL) {
1226 stream->last_sequence_number = seq;
1227 } else if (seq > stream->last_sequence_number) {
1228 stream->chan->lost_packets += seq -
1229 stream->last_sequence_number - 1;
1230 } else {
1231 /* seq <= last_sequence_number */
1232 ERR("Sequence number inconsistent : prev = %" PRIu64
1233 ", current = %" PRIu64,
1234 stream->last_sequence_number, seq);
1235 ret = -1;
1236 goto end;
1237 }
1238 stream->last_sequence_number = seq;
1239
1240 ret = kernctl_get_events_discarded(stream->wait_fd, &discarded);
1241 if (ret < 0) {
1242 PERROR("kernctl_get_events_discarded");
1243 goto end;
1244 }
1245 if (discarded < stream->last_discarded_events) {
1246 /*
83f4233d
MJ
1247 * Overflow has occurred. We assume only one wrap-around
1248 * has occurred.
fb83fe64
JD
1249 */
1250 stream->chan->discarded_events += (1ULL << (CAA_BITS_PER_LONG - 1)) -
1251 stream->last_discarded_events + discarded;
1252 } else {
1253 stream->chan->discarded_events += discarded -
1254 stream->last_discarded_events;
1255 }
1256 stream->last_discarded_events = discarded;
1257 ret = 0;
1258
1259end:
1260 return ret;
1261}
1262
93ec662e
JD
1263/*
1264 * Check if the local version of the metadata stream matches with the version
1265 * of the metadata stream in the kernel. If it was updated, set the reset flag
1266 * on the stream.
1267 */
1268static
1269int metadata_stream_check_version(int infd, struct lttng_consumer_stream *stream)
1270{
1271 int ret;
1272 uint64_t cur_version;
1273
1274 ret = kernctl_get_metadata_version(infd, &cur_version);
1275 if (ret < 0) {
f0b03c22
MD
1276 if (ret == -ENOTTY) {
1277 /*
1278 * LTTng-modules does not implement this
1279 * command.
1280 */
1281 ret = 0;
1282 goto end;
1283 }
93ec662e
JD
1284 ERR("Failed to get the metadata version");
1285 goto end;
1286 }
1287
1288 if (stream->metadata_version == cur_version) {
1289 ret = 0;
1290 goto end;
1291 }
1292
1293 DBG("New metadata version detected");
1294 stream->metadata_version = cur_version;
1295 stream->reset_metadata_flag = 1;
1296 ret = 0;
1297
1298end:
1299 return ret;
1300}
1301
d41f73b7
MD
1302/*
1303 * Consume data on a file descriptor and write it on a trace file.
1304 */
4078b776 1305ssize_t lttng_kconsumer_read_subbuffer(struct lttng_consumer_stream *stream,
d41f73b7
MD
1306 struct lttng_consumer_local_data *ctx)
1307{
1d4dfdef 1308 unsigned long len, subbuf_size, padding;
1c20f0e2 1309 int err, write_index = 1;
4078b776 1310 ssize_t ret = 0;
d41f73b7 1311 int infd = stream->wait_fd;
50adc264 1312 struct ctf_packet_index index;
d41f73b7
MD
1313
1314 DBG("In read_subbuffer (infd : %d)", infd);
309167d2 1315
d41f73b7
MD
1316 /* Get the next subbuffer */
1317 err = kernctl_get_next_subbuf(infd);
1318 if (err != 0) {
d41f73b7
MD
1319 /*
1320 * This is a debug message even for single-threaded consumer,
1321 * because poll() have more relaxed criterions than get subbuf,
1322 * so get_subbuf may fail for short race windows where poll()
1323 * would issue wakeups.
1324 */
1325 DBG("Reserving sub buffer failed (everything is normal, "
1326 "it is due to concurrency)");
32af2c95 1327 ret = err;
d41f73b7
MD
1328 goto end;
1329 }
1330
1d4dfdef
DG
1331 /* Get the full subbuffer size including padding */
1332 err = kernctl_get_padded_subbuf_size(infd, &len);
1333 if (err != 0) {
5a510c9f 1334 PERROR("Getting sub-buffer len failed.");
8265f19e
MD
1335 err = kernctl_put_subbuf(infd);
1336 if (err != 0) {
32af2c95 1337 if (err == -EFAULT) {
5a510c9f 1338 PERROR("Error in unreserving sub buffer\n");
32af2c95 1339 } else if (err == -EIO) {
8265f19e 1340 /* Should never happen with newer LTTng versions */
5a510c9f 1341 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
8265f19e 1342 }
32af2c95 1343 ret = err;
8265f19e
MD
1344 goto end;
1345 }
32af2c95 1346 ret = err;
1d4dfdef
DG
1347 goto end;
1348 }
1349
1c20f0e2 1350 if (!stream->metadata_flag) {
309167d2
JD
1351 ret = get_index_values(&index, infd);
1352 if (ret < 0) {
8265f19e
MD
1353 err = kernctl_put_subbuf(infd);
1354 if (err != 0) {
32af2c95 1355 if (err == -EFAULT) {
5a510c9f 1356 PERROR("Error in unreserving sub buffer\n");
32af2c95 1357 } else if (err == -EIO) {
8265f19e 1358 /* Should never happen with newer LTTng versions */
5a510c9f 1359 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
8265f19e 1360 }
32af2c95 1361 ret = err;
8265f19e
MD
1362 goto end;
1363 }
309167d2
JD
1364 goto end;
1365 }
fb83fe64
JD
1366 ret = update_stream_stats(stream);
1367 if (ret < 0) {
becac7c4
MD
1368 err = kernctl_put_subbuf(infd);
1369 if (err != 0) {
1370 if (err == -EFAULT) {
1371 PERROR("Error in unreserving sub buffer\n");
1372 } else if (err == -EIO) {
1373 /* Should never happen with newer LTTng versions */
1374 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
1375 }
1376 ret = err;
1377 goto end;
1378 }
fb83fe64
JD
1379 goto end;
1380 }
1c20f0e2
JD
1381 } else {
1382 write_index = 0;
93ec662e
JD
1383 ret = metadata_stream_check_version(infd, stream);
1384 if (ret < 0) {
becac7c4
MD
1385 err = kernctl_put_subbuf(infd);
1386 if (err != 0) {
1387 if (err == -EFAULT) {
1388 PERROR("Error in unreserving sub buffer\n");
1389 } else if (err == -EIO) {
1390 /* Should never happen with newer LTTng versions */
1391 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
1392 }
1393 ret = err;
1394 goto end;
1395 }
93ec662e
JD
1396 goto end;
1397 }
309167d2
JD
1398 }
1399
ffe60014 1400 switch (stream->chan->output) {
07b86b52 1401 case CONSUMER_CHANNEL_SPLICE:
1d4dfdef
DG
1402 /*
1403 * XXX: The lttng-modules splice "actor" does not handle copying
1404 * partial pages hence only using the subbuffer size without the
1405 * padding makes the splice fail.
1406 */
1407 subbuf_size = len;
1408 padding = 0;
1409
1410 /* splice the subbuffer to the tracefile */
91dfef6e 1411 ret = lttng_consumer_on_read_subbuffer_splice(ctx, stream, subbuf_size,
309167d2 1412 padding, &index);
91dfef6e
DG
1413 /*
1414 * XXX: Splice does not support network streaming so the return value
1415 * is simply checked against subbuf_size and not like the mmap() op.
1416 */
1d4dfdef
DG
1417 if (ret != subbuf_size) {
1418 /*
1419 * display the error but continue processing to try
1420 * to release the subbuffer
1421 */
1422 ERR("Error splicing to tracefile (ret: %zd != len: %lu)",
1423 ret, subbuf_size);
309167d2 1424 write_index = 0;
1d4dfdef
DG
1425 }
1426 break;
07b86b52 1427 case CONSUMER_CHANNEL_MMAP:
1fdb9a78
JG
1428 {
1429 const char *subbuf_addr;
ace0e591 1430 struct lttng_buffer_view subbuf_view;
1fdb9a78 1431
1d4dfdef
DG
1432 /* Get subbuffer size without padding */
1433 err = kernctl_get_subbuf_size(infd, &subbuf_size);
1434 if (err != 0) {
5a510c9f 1435 PERROR("Getting sub-buffer len failed.");
8265f19e
MD
1436 err = kernctl_put_subbuf(infd);
1437 if (err != 0) {
32af2c95 1438 if (err == -EFAULT) {
5a510c9f 1439 PERROR("Error in unreserving sub buffer\n");
32af2c95 1440 } else if (err == -EIO) {
8265f19e 1441 /* Should never happen with newer LTTng versions */
5a510c9f 1442 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
8265f19e 1443 }
32af2c95 1444 ret = err;
8265f19e
MD
1445 goto end;
1446 }
32af2c95 1447 ret = err;
1d4dfdef
DG
1448 goto end;
1449 }
47e81c02 1450
1fdb9a78
JG
1451 ret = get_current_subbuf_addr(stream, &subbuf_addr);
1452 if (ret) {
1453 goto error_put_subbuf;
1454 }
1455
1d4dfdef
DG
1456 /* Make sure the tracer is not gone mad on us! */
1457 assert(len >= subbuf_size);
1458
1459 padding = len - subbuf_size;
1460
ace0e591
JG
1461 subbuf_view = lttng_buffer_view_init(subbuf_addr, 0, len);
1462
1d4dfdef 1463 /* write the subbuffer to the tracefile */
ace0e591
JG
1464 ret = lttng_consumer_on_read_subbuffer_mmap(
1465 ctx, stream, &subbuf_view, padding, &index);
91dfef6e 1466 /*
ace0e591
JG
1467 * The mmap operation should write subbuf_size amount of data
1468 * when network streaming or the full padding (len) size when we
1469 * are _not_ streaming.
91dfef6e 1470 */
6d40f8fa
JG
1471 if ((ret != subbuf_size && stream->relayd_id != (uint64_t) -1ULL) ||
1472 (ret != len && stream->relayd_id == (uint64_t) -1ULL)) {
1d4dfdef 1473 /*
91dfef6e 1474 * Display the error but continue processing to try to release the
2336629e
DG
1475 * subbuffer. This is a DBG statement since this is possible to
1476 * happen without being a critical error.
1d4dfdef 1477 */
2336629e 1478 DBG("Error writing to tracefile "
91dfef6e
DG
1479 "(ret: %zd != len: %lu != subbuf_size: %lu)",
1480 ret, len, subbuf_size);
309167d2 1481 write_index = 0;
1d4dfdef
DG
1482 }
1483 break;
1fdb9a78 1484 }
1d4dfdef
DG
1485 default:
1486 ERR("Unknown output method");
56591bac 1487 ret = -EPERM;
d41f73b7 1488 }
1fdb9a78 1489error_put_subbuf:
d41f73b7
MD
1490 err = kernctl_put_next_subbuf(infd);
1491 if (err != 0) {
32af2c95 1492 if (err == -EFAULT) {
5a510c9f 1493 PERROR("Error in unreserving sub buffer\n");
32af2c95 1494 } else if (err == -EIO) {
d41f73b7 1495 /* Should never happen with newer LTTng versions */
5a510c9f 1496 PERROR("Reader has been pushed by the writer, last sub-buffer corrupted.");
d41f73b7 1497 }
32af2c95 1498 ret = err;
d41f73b7
MD
1499 goto end;
1500 }
1501
309167d2 1502 /* Write index if needed. */
1c20f0e2
JD
1503 if (!write_index) {
1504 goto end;
1505 }
1506
94d49140
JD
1507 if (stream->chan->live_timer_interval && !stream->metadata_flag) {
1508 /*
1509 * In live, block until all the metadata is sent.
1510 */
c585821b
MD
1511 pthread_mutex_lock(&stream->metadata_timer_lock);
1512 assert(!stream->missed_metadata_flush);
1513 stream->waiting_on_metadata = true;
1514 pthread_mutex_unlock(&stream->metadata_timer_lock);
1515
94d49140 1516 err = consumer_stream_sync_metadata(ctx, stream->session_id);
c585821b
MD
1517
1518 pthread_mutex_lock(&stream->metadata_timer_lock);
1519 stream->waiting_on_metadata = false;
1520 if (stream->missed_metadata_flush) {
1521 stream->missed_metadata_flush = false;
1522 pthread_mutex_unlock(&stream->metadata_timer_lock);
1523 (void) consumer_flush_kernel_index(stream);
1524 } else {
1525 pthread_mutex_unlock(&stream->metadata_timer_lock);
1526 }
94d49140
JD
1527 if (err < 0) {
1528 goto end;
1529 }
1530 }
1531
1c20f0e2
JD
1532 err = consumer_stream_write_index(stream, &index);
1533 if (err < 0) {
1534 goto end;
309167d2
JD
1535 }
1536
d41f73b7
MD
1537end:
1538 return ret;
1539}
1540
1541int lttng_kconsumer_on_recv_stream(struct lttng_consumer_stream *stream)
1542{
1543 int ret;
ffe60014
DG
1544
1545 assert(stream);
1546
2bba9e53
DG
1547 /*
1548 * Don't create anything if this is set for streaming or should not be
1549 * monitored.
1550 */
6d40f8fa 1551 if (stream->relayd_id == (uint64_t) -1ULL && stream->chan->monitor) {
fe4477ee
JD
1552 ret = utils_create_stream_file(stream->chan->pathname, stream->name,
1553 stream->chan->tracefile_size, stream->tracefile_count_current,
309167d2 1554 stream->uid, stream->gid, NULL);
fe4477ee
JD
1555 if (ret < 0) {
1556 goto error;
1557 }
1558 stream->out_fd = ret;
1559 stream->tracefile_size_current = 0;
309167d2
JD
1560
1561 if (!stream->metadata_flag) {
e0547b83
MD
1562 struct lttng_index_file *index_file;
1563
1564 index_file = lttng_index_file_create(stream->chan->pathname,
309167d2
JD
1565 stream->name, stream->uid, stream->gid,
1566 stream->chan->tracefile_size,
e0547b83
MD
1567 stream->tracefile_count_current,
1568 CTF_INDEX_MAJOR, CTF_INDEX_MINOR);
1569 if (!index_file) {
309167d2
JD
1570 goto error;
1571 }
e0547b83 1572 stream->index_file = index_file;
309167d2 1573 }
ffe60014 1574 }
d41f73b7 1575
d41f73b7
MD
1576 if (stream->output == LTTNG_EVENT_MMAP) {
1577 /* get the len of the mmap region */
1578 unsigned long mmap_len;
1579
1580 ret = kernctl_get_mmap_len(stream->wait_fd, &mmap_len);
1581 if (ret != 0) {
ffe60014 1582 PERROR("kernctl_get_mmap_len");
d41f73b7
MD
1583 goto error_close_fd;
1584 }
1585 stream->mmap_len = (size_t) mmap_len;
1586
ffe60014
DG
1587 stream->mmap_base = mmap(NULL, stream->mmap_len, PROT_READ,
1588 MAP_PRIVATE, stream->wait_fd, 0);
d41f73b7 1589 if (stream->mmap_base == MAP_FAILED) {
ffe60014 1590 PERROR("Error mmaping");
d41f73b7
MD
1591 ret = -1;
1592 goto error_close_fd;
1593 }
1594 }
1595
1596 /* we return 0 to let the library handle the FD internally */
1597 return 0;
1598
1599error_close_fd:
2f225ce2 1600 if (stream->out_fd >= 0) {
d41f73b7
MD
1601 int err;
1602
1603 err = close(stream->out_fd);
1604 assert(!err);
2f225ce2 1605 stream->out_fd = -1;
d41f73b7
MD
1606 }
1607error:
1608 return ret;
1609}
1610
ca22feea
DG
1611/*
1612 * Check if data is still being extracted from the buffers for a specific
4e9a4686
DG
1613 * stream. Consumer data lock MUST be acquired before calling this function
1614 * and the stream lock.
ca22feea 1615 *
6d805429 1616 * Return 1 if the traced data are still getting read else 0 meaning that the
ca22feea
DG
1617 * data is available for trace viewer reading.
1618 */
6d805429 1619int lttng_kconsumer_data_pending(struct lttng_consumer_stream *stream)
ca22feea
DG
1620{
1621 int ret;
1622
1623 assert(stream);
1624
873b9e9a
MD
1625 if (stream->endpoint_status != CONSUMER_ENDPOINT_ACTIVE) {
1626 ret = 0;
1627 goto end;
1628 }
1629
ca22feea
DG
1630 ret = kernctl_get_next_subbuf(stream->wait_fd);
1631 if (ret == 0) {
1632 /* There is still data so let's put back this subbuffer. */
1633 ret = kernctl_put_subbuf(stream->wait_fd);
1634 assert(ret == 0);
6d805429 1635 ret = 1; /* Data is pending */
4e9a4686 1636 goto end;
ca22feea
DG
1637 }
1638
6d805429
DG
1639 /* Data is NOT pending and ready to be read. */
1640 ret = 0;
ca22feea 1641
6efae65e
DG
1642end:
1643 return ret;
ca22feea 1644}
This page took 0.158712 seconds and 5 git commands to generate.