Commit | Line | Data |
---|---|---|
e98a2d6e | 1 | /* |
0235b0db | 2 | * SPDX-License-Identifier: MIT |
e98a2d6e | 3 | * |
0235b0db MJ |
4 | * Copyright 2016-2017 Philippe Proulx <pproulx@efficios.com> |
5 | * Copyright 2016 Jérémie Galarneau <jeremie.galarneau@efficios.com> | |
6 | * Copyright 2010-2011 EfficiOS Inc. and Linux Foundation | |
e98a2d6e PP |
7 | */ |
8 | ||
c802cacb | 9 | #include <glib.h> |
c802cacb SM |
10 | #include <stdint.h> |
11 | #include <stdio.h> | |
c802cacb | 12 | |
83ad336c | 13 | #include "compat/endian.h" /* IWYU pragma: keep */ |
0f5c5d5c | 14 | #include "compat/mman.h" /* IWYU pragma: keep */ |
2cef6403 | 15 | #include "cpp-common/bt2s/make-unique.hpp" |
0f5c5d5c | 16 | #include "cpp-common/vendor/fmt/format.h" |
c802cacb | 17 | |
5656cea5 | 18 | #include "../common/src/msg-iter/msg-iter.hpp" |
087cd0f5 | 19 | #include "data-stream-file.hpp" |
c802cacb | 20 | #include "file.hpp" |
c7e1be4b SM |
21 | #include "fs.hpp" |
22 | #include "lttng-index.hpp" | |
e98a2d6e | 23 | |
4164020e | 24 | static inline size_t remaining_mmap_bytes(struct ctf_fs_ds_file *ds_file) |
e98a2d6e | 25 | { |
4164020e SM |
26 | BT_ASSERT_DBG(ds_file->mmap_len >= ds_file->request_offset_in_mapping); |
27 | return ds_file->mmap_len - ds_file->request_offset_in_mapping; | |
e98a2d6e PP |
28 | } |
29 | ||
127e2341 SM |
30 | /* |
31 | * Return true if `offset_in_file` is in the current mapping. | |
32 | */ | |
33 | ||
4164020e | 34 | static bool offset_ist_mapped(struct ctf_fs_ds_file *ds_file, off_t offset_in_file) |
127e2341 | 35 | { |
4164020e SM |
36 | return offset_in_file >= ds_file->mmap_offset_in_file && |
37 | offset_in_file < (ds_file->mmap_offset_in_file + ds_file->mmap_len); | |
127e2341 SM |
38 | } |
39 | ||
4164020e | 40 | static enum ctf_msg_iter_medium_status ds_file_munmap(struct ctf_fs_ds_file *ds_file) |
e98a2d6e | 41 | { |
4164020e | 42 | enum ctf_msg_iter_medium_status status; |
4164020e SM |
43 | |
44 | BT_ASSERT(ds_file); | |
45 | ||
46 | if (!ds_file->mmap_addr) { | |
47 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
48 | goto end; | |
49 | } | |
50 | ||
51 | if (bt_munmap(ds_file->mmap_addr, ds_file->mmap_len)) { | |
0f5c5d5c SM |
52 | BT_CPPLOGE_ERRNO_SPEC(ds_file->logger, "Cannot memory-unmap file", |
53 | ": address={}, size={}, file_path=\"{}\", file={}", | |
54 | fmt::ptr(ds_file->mmap_addr), ds_file->mmap_len, | |
a39d9817 | 55 | ds_file->file ? ds_file->file->path : "NULL", |
0f5c5d5c | 56 | ds_file->file ? fmt::ptr(ds_file->file->fp) : NULL); |
4164020e SM |
57 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
58 | goto end; | |
59 | } | |
60 | ||
61 | ds_file->mmap_addr = NULL; | |
62 | ||
63 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
fc9a526c | 64 | end: |
4164020e | 65 | return status; |
e98a2d6e PP |
66 | } |
67 | ||
127e2341 SM |
68 | /* |
69 | * mmap a region of `ds_file` such that `requested_offset_in_file` is in the | |
70 | * mapping. If the currently mmap-ed region already contains | |
71 | * `requested_offset_in_file`, the mapping is kept. | |
72 | * | |
f6e68e70 SM |
73 | * Set `ds_file->request_offset_in_mapping` based on `requested_offset_in_file`, |
74 | * such that the next call to `request_bytes` will return bytes starting at that | |
75 | * position. | |
127e2341 SM |
76 | * |
77 | * `requested_offset_in_file` must be a valid offset in the file. | |
78 | */ | |
4164020e SM |
79 | static enum ctf_msg_iter_medium_status ds_file_mmap(struct ctf_fs_ds_file *ds_file, |
80 | off_t requested_offset_in_file) | |
e98a2d6e | 81 | { |
4164020e | 82 | enum ctf_msg_iter_medium_status status; |
4164020e SM |
83 | |
84 | /* Ensure the requested offset is in the file range. */ | |
85 | BT_ASSERT(requested_offset_in_file >= 0); | |
86 | BT_ASSERT(requested_offset_in_file < ds_file->file->size); | |
87 | ||
88 | /* | |
89 | * If the mapping already contains the requested offset, just adjust | |
90 | * requested_offset_in_mapping. | |
91 | */ | |
92 | if (offset_ist_mapped(ds_file, requested_offset_in_file)) { | |
93 | ds_file->request_offset_in_mapping = | |
94 | requested_offset_in_file - ds_file->mmap_offset_in_file; | |
95 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
96 | goto end; | |
97 | } | |
98 | ||
99 | /* Unmap old region */ | |
100 | status = ds_file_munmap(ds_file); | |
101 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { | |
102 | goto end; | |
103 | } | |
104 | ||
105 | /* | |
106 | * Compute a mapping that has the required alignment properties and | |
107 | * contains `requested_offset_in_file`. | |
108 | */ | |
109 | ds_file->request_offset_in_mapping = | |
0f5c5d5c SM |
110 | requested_offset_in_file % |
111 | bt_mmap_get_offset_align_size(static_cast<int>(ds_file->logger.level())); | |
4164020e SM |
112 | ds_file->mmap_offset_in_file = requested_offset_in_file - ds_file->request_offset_in_mapping; |
113 | ds_file->mmap_len = | |
114 | MIN(ds_file->file->size - ds_file->mmap_offset_in_file, ds_file->mmap_max_len); | |
115 | ||
116 | BT_ASSERT(ds_file->mmap_len > 0); | |
117 | ||
118 | ds_file->mmap_addr = | |
85a25425 | 119 | bt_mmap(ds_file->mmap_len, PROT_READ, MAP_PRIVATE, fileno(ds_file->file->fp.get()), |
0f5c5d5c | 120 | ds_file->mmap_offset_in_file, static_cast<int>(ds_file->logger.level())); |
4164020e | 121 | if (ds_file->mmap_addr == MAP_FAILED) { |
0f5c5d5c SM |
122 | BT_CPPLOGE_SPEC(ds_file->logger, |
123 | "Cannot memory-map address (size {}) of file \"{}\" ({}) at offset {}: {}", | |
a39d9817 | 124 | ds_file->mmap_len, ds_file->file->path, fmt::ptr(ds_file->file->fp), |
0f5c5d5c | 125 | (intmax_t) ds_file->mmap_offset_in_file, strerror(errno)); |
4164020e SM |
126 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
127 | goto end; | |
128 | } | |
129 | ||
130 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
127e2341 SM |
131 | |
132 | end: | |
4164020e | 133 | return status; |
127e2341 SM |
134 | } |
135 | ||
136 | /* | |
137 | * Change the mapping of the file to read the region that follows the current | |
138 | * mapping. | |
139 | * | |
140 | * If the file hasn't been mapped yet, then everything (mmap_offset_in_file, | |
141 | * mmap_len, request_offset_in_mapping) should have the value 0, which will | |
142 | * result in the beginning of the file getting mapped. | |
143 | * | |
144 | * return _EOF if the current mapping is the end of the file. | |
145 | */ | |
146 | ||
4164020e | 147 | static enum ctf_msg_iter_medium_status ds_file_mmap_next(struct ctf_fs_ds_file *ds_file) |
127e2341 | 148 | { |
4164020e SM |
149 | enum ctf_msg_iter_medium_status status; |
150 | ||
151 | /* | |
152 | * If we're called, it's because more bytes are requested but we have | |
153 | * given all the bytes of the current mapping. | |
154 | */ | |
155 | BT_ASSERT(ds_file->request_offset_in_mapping == ds_file->mmap_len); | |
156 | ||
157 | /* | |
158 | * If the current mapping coincides with the end of the file, there is | |
159 | * no next mapping. | |
160 | */ | |
161 | if (ds_file->mmap_offset_in_file + ds_file->mmap_len == ds_file->file->size) { | |
162 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; | |
163 | goto end; | |
164 | } | |
165 | ||
166 | status = ds_file_mmap(ds_file, ds_file->mmap_offset_in_file + ds_file->mmap_len); | |
127e2341 | 167 | |
e98a2d6e | 168 | end: |
4164020e | 169 | return status; |
e98a2d6e PP |
170 | } |
171 | ||
4164020e SM |
172 | static enum ctf_msg_iter_medium_status medop_request_bytes(size_t request_sz, uint8_t **buffer_addr, |
173 | size_t *buffer_sz, void *data) | |
e98a2d6e | 174 | { |
4164020e SM |
175 | enum ctf_msg_iter_medium_status status = CTF_MSG_ITER_MEDIUM_STATUS_OK; |
176 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; | |
4164020e SM |
177 | |
178 | BT_ASSERT(request_sz > 0); | |
179 | ||
180 | /* | |
181 | * Check if we have at least one memory-mapped byte left. If we don't, | |
182 | * mmap the next file. | |
183 | */ | |
184 | if (remaining_mmap_bytes(ds_file) == 0) { | |
185 | /* Are we at the end of the file? */ | |
186 | if (ds_file->mmap_offset_in_file >= ds_file->file->size) { | |
a39d9817 SM |
187 | BT_CPPLOGD_SPEC(ds_file->logger, "Reached end of file \"{}\" ({})", ds_file->file->path, |
188 | fmt::ptr(ds_file->file->fp)); | |
4164020e SM |
189 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; |
190 | goto end; | |
191 | } | |
192 | ||
193 | status = ds_file_mmap_next(ds_file); | |
194 | switch (status) { | |
195 | case CTF_MSG_ITER_MEDIUM_STATUS_OK: | |
196 | break; | |
197 | case CTF_MSG_ITER_MEDIUM_STATUS_EOF: | |
198 | goto end; | |
199 | default: | |
0f5c5d5c | 200 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot memory-map next region of file \"{}\" ({})", |
a39d9817 | 201 | ds_file->file->path, fmt::ptr(ds_file->file->fp)); |
4164020e SM |
202 | goto error; |
203 | } | |
204 | } | |
205 | ||
206 | BT_ASSERT(remaining_mmap_bytes(ds_file) > 0); | |
207 | *buffer_sz = MIN(remaining_mmap_bytes(ds_file), request_sz); | |
208 | ||
209 | BT_ASSERT(ds_file->mmap_addr); | |
210 | *buffer_addr = ((uint8_t *) ds_file->mmap_addr) + ds_file->request_offset_in_mapping; | |
211 | ||
212 | ds_file->request_offset_in_mapping += *buffer_sz; | |
213 | goto end; | |
e98a2d6e PP |
214 | |
215 | error: | |
4164020e | 216 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
e98a2d6e PP |
217 | |
218 | end: | |
4164020e | 219 | return status; |
e98a2d6e PP |
220 | } |
221 | ||
ecd7492f | 222 | static bt_stream *medop_borrow_stream(bt_stream_class *stream_class, int64_t, void *data) |
e98a2d6e | 223 | { |
4164020e SM |
224 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; |
225 | bt_stream_class *ds_file_stream_class; | |
226 | bt_stream *stream = NULL; | |
e5be10ef | 227 | |
265d4ba2 | 228 | ds_file_stream_class = ds_file->stream->cls().libObjPtr(); |
94cf822e | 229 | |
4164020e SM |
230 | if (stream_class != ds_file_stream_class) { |
231 | /* | |
232 | * Not supported: two packets described by two different | |
233 | * stream classes within the same data stream file. | |
234 | */ | |
235 | goto end; | |
236 | } | |
e98a2d6e | 237 | |
265d4ba2 | 238 | stream = ds_file->stream->libObjPtr(); |
94cf822e PP |
239 | |
240 | end: | |
4164020e | 241 | return stream; |
e98a2d6e PP |
242 | } |
243 | ||
4164020e | 244 | static enum ctf_msg_iter_medium_status medop_seek(off_t offset, void *data) |
9e0c8dbb | 245 | { |
4164020e | 246 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; |
9e0c8dbb | 247 | |
4164020e SM |
248 | BT_ASSERT(offset >= 0); |
249 | BT_ASSERT(offset < ds_file->file->size); | |
9e0c8dbb | 250 | |
4164020e | 251 | return ds_file_mmap(ds_file, offset); |
9e0c8dbb JG |
252 | } |
253 | ||
18a1979b | 254 | struct ctf_msg_iter_medium_ops ctf_fs_ds_file_medops = { |
4164020e SM |
255 | medop_request_bytes, |
256 | medop_seek, | |
257 | nullptr, | |
258 | medop_borrow_stream, | |
e98a2d6e | 259 | }; |
6de92955 | 260 | |
4164020e SM |
261 | struct ctf_fs_ds_group_medops_data |
262 | { | |
0f5c5d5c SM |
263 | explicit ctf_fs_ds_group_medops_data(const bt2c::Logger& parentLogger) : |
264 | logger {parentLogger, "PLUGIN/SRC.CTF.FS/DS-GROUP-MEDOPS"} | |
265 | { | |
266 | } | |
267 | ||
268 | bt2c::Logger logger; | |
269 | ||
4164020e | 270 | /* Weak, set once at creation time. */ |
afb0f12b | 271 | struct ctf_fs_ds_file_group *ds_file_group = nullptr; |
4164020e SM |
272 | |
273 | /* | |
274 | * Index (as in element rank) of the index entry of ds_file_groups' | |
275 | * index we will read next (so, the one after the one we are reading | |
276 | * right now). | |
277 | */ | |
afb0f12b | 278 | guint next_index_entry_index = 0; |
4164020e SM |
279 | |
280 | /* | |
281 | * File we are currently reading. Changes whenever we switch to | |
282 | * reading another data file. | |
4164020e | 283 | */ |
55ea683f | 284 | ctf_fs_ds_file::UP file; |
4164020e SM |
285 | |
286 | /* Weak, for context / logging / appending causes. */ | |
afb0f12b | 287 | bt_self_message_iterator *self_msg_iter = nullptr; |
f6e68e70 SM |
288 | }; |
289 | ||
4164020e SM |
290 | static enum ctf_msg_iter_medium_status medop_group_request_bytes(size_t request_sz, |
291 | uint8_t **buffer_addr, | |
292 | size_t *buffer_sz, void *void_data) | |
f6e68e70 | 293 | { |
4164020e | 294 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
f6e68e70 | 295 | |
4164020e | 296 | /* Return bytes from the current file. */ |
55ea683f | 297 | return medop_request_bytes(request_sz, buffer_addr, buffer_sz, data->file.get()); |
f6e68e70 SM |
298 | } |
299 | ||
4164020e SM |
300 | static bt_stream *medop_group_borrow_stream(bt_stream_class *stream_class, int64_t stream_id, |
301 | void *void_data) | |
f6e68e70 | 302 | { |
4164020e | 303 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
f6e68e70 | 304 | |
55ea683f | 305 | return medop_borrow_stream(stream_class, stream_id, data->file.get()); |
f6e68e70 SM |
306 | } |
307 | ||
308 | /* | |
309 | * Set `data->file` to prepare it to read the packet described | |
310 | * by `index_entry`. | |
311 | */ | |
312 | ||
4164020e SM |
313 | static enum ctf_msg_iter_medium_status |
314 | ctf_fs_ds_group_medops_set_file(struct ctf_fs_ds_group_medops_data *data, | |
0f5c5d5c | 315 | struct ctf_fs_ds_index_entry *index_entry) |
f6e68e70 | 316 | { |
4164020e SM |
317 | enum ctf_msg_iter_medium_status status; |
318 | ||
319 | BT_ASSERT(data); | |
320 | BT_ASSERT(index_entry); | |
321 | ||
322 | /* Check if that file is already the one mapped. */ | |
a39d9817 | 323 | if (!data->file || data->file->file->path != index_entry->path) { |
4164020e | 324 | /* Create the new file. */ |
265d4ba2 SM |
325 | data->file = |
326 | ctf_fs_ds_file_create(data->ds_file_group->ctf_fs_trace, data->ds_file_group->stream, | |
55ea683f | 327 | index_entry->path, data->logger); |
4164020e | 328 | if (!data->file) { |
0f5c5d5c | 329 | BT_CPPLOGE_APPEND_CAUSE_SPEC(data->logger, "failed to create ctf_fs_ds_file."); |
4164020e SM |
330 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
331 | goto end; | |
332 | } | |
333 | } | |
334 | ||
335 | /* | |
336 | * Ensure the right portion of the file will be returned on the next | |
337 | * request_bytes call. | |
338 | */ | |
55ea683f | 339 | status = ds_file_mmap(data->file.get(), index_entry->offset.bytes()); |
4164020e SM |
340 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { |
341 | goto end; | |
342 | } | |
343 | ||
344 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
f6e68e70 SM |
345 | |
346 | end: | |
4164020e | 347 | return status; |
f6e68e70 SM |
348 | } |
349 | ||
4164020e | 350 | static enum ctf_msg_iter_medium_status medop_group_switch_packet(void *void_data) |
f6e68e70 | 351 | { |
4164020e SM |
352 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
353 | struct ctf_fs_ds_index_entry *index_entry; | |
354 | enum ctf_msg_iter_medium_status status; | |
355 | ||
356 | /* If we have gone through all index entries, we are done. */ | |
2fb7af12 | 357 | if (data->next_index_entry_index >= data->ds_file_group->index->entries.size()) { |
4164020e SM |
358 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; |
359 | goto end; | |
360 | } | |
361 | ||
362 | /* | |
363 | * Otherwise, look up the next index entry / packet and prepare it | |
364 | * for reading. | |
365 | */ | |
2fb7af12 | 366 | index_entry = data->ds_file_group->index->entries[data->next_index_entry_index].get(); |
4164020e | 367 | |
0f5c5d5c | 368 | status = ctf_fs_ds_group_medops_set_file(data, index_entry); |
4164020e SM |
369 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { |
370 | goto end; | |
371 | } | |
372 | ||
373 | data->next_index_entry_index++; | |
374 | ||
375 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
f6e68e70 | 376 | end: |
4164020e | 377 | return status; |
f6e68e70 SM |
378 | } |
379 | ||
3cf88182 SM |
380 | void ctf_fs_ds_group_medops_data_deleter::operator()(ctf_fs_ds_group_medops_data *data) noexcept |
381 | { | |
2db013e0 | 382 | delete data; |
3cf88182 SM |
383 | } |
384 | ||
f6e68e70 | 385 | enum ctf_msg_iter_medium_status ctf_fs_ds_group_medops_data_create( |
4164020e | 386 | struct ctf_fs_ds_file_group *ds_file_group, bt_self_message_iterator *self_msg_iter, |
3cf88182 | 387 | const bt2c::Logger& parentLogger, ctf_fs_ds_group_medops_data_up& out) |
f6e68e70 | 388 | { |
4164020e SM |
389 | BT_ASSERT(self_msg_iter); |
390 | BT_ASSERT(ds_file_group); | |
391 | BT_ASSERT(ds_file_group->index); | |
2fb7af12 | 392 | BT_ASSERT(!ds_file_group->index->entries.empty()); |
4164020e | 393 | |
3cf88182 SM |
394 | out.reset(new ctf_fs_ds_group_medops_data {parentLogger}); |
395 | ||
396 | out->ds_file_group = ds_file_group; | |
397 | out->self_msg_iter = self_msg_iter; | |
4164020e SM |
398 | |
399 | /* | |
400 | * No need to prepare the first file. ctf_msg_iter will call | |
401 | * switch_packet before reading the first packet, it will be | |
402 | * done then. | |
403 | */ | |
404 | ||
afb0f12b | 405 | return CTF_MSG_ITER_MEDIUM_STATUS_OK; |
f6e68e70 SM |
406 | } |
407 | ||
408 | void ctf_fs_ds_group_medops_data_reset(struct ctf_fs_ds_group_medops_data *data) | |
409 | { | |
4164020e | 410 | data->next_index_entry_index = 0; |
f6e68e70 SM |
411 | } |
412 | ||
413 | struct ctf_msg_iter_medium_ops ctf_fs_ds_group_medops = { | |
4164020e | 414 | .request_bytes = medop_group_request_bytes, |
f6e68e70 | 415 | |
4164020e SM |
416 | /* |
417 | * We don't support seeking using this medops. It would probably be | |
418 | * possible, but it's not needed at the moment. | |
419 | */ | |
420 | .seek = NULL, | |
087cd0f5 | 421 | |
4164020e SM |
422 | .switch_packet = medop_group_switch_packet, |
423 | .borrow_stream = medop_group_borrow_stream, | |
f6e68e70 SM |
424 | }; |
425 | ||
c05e1405 SM |
426 | static ctf_fs_ds_index_entry::UP ctf_fs_ds_index_entry_create(const bt2c::DataLen offset, |
427 | const bt2c::DataLen packetSize) | |
afb0f12b | 428 | { |
c05e1405 | 429 | ctf_fs_ds_index_entry::UP entry = bt2s::make_unique<ctf_fs_ds_index_entry>(offset, packetSize); |
ef7d7ac2 | 430 | |
4164020e | 431 | entry->packet_seq_num = UINT64_MAX; |
6834784d | 432 | |
4164020e | 433 | return entry; |
6834784d SM |
434 | } |
435 | ||
4164020e | 436 | static int convert_cycles_to_ns(struct ctf_clock_class *clock_class, uint64_t cycles, int64_t *ns) |
b6c3dcb2 | 437 | { |
4164020e SM |
438 | return bt_util_clock_cycles_to_ns_from_origin(cycles, clock_class->frequency, |
439 | clock_class->offset_seconds, | |
440 | clock_class->offset_cycles, ns); | |
97ade20b JG |
441 | } |
442 | ||
441fa755 SM |
443 | static ctf_fs_ds_index::UP build_index_from_idx_file(struct ctf_fs_ds_file *ds_file, |
444 | struct ctf_fs_ds_file_info *file_info, | |
445 | struct ctf_msg_iter *msg_iter) | |
97ade20b | 446 | { |
4164020e SM |
447 | int ret; |
448 | gchar *directory = NULL; | |
449 | gchar *basename = NULL; | |
450 | GString *index_basename = NULL; | |
451 | gchar *index_file_path = NULL; | |
452 | GMappedFile *mapped_file = NULL; | |
453 | gsize filesize; | |
454 | const char *mmap_begin = NULL, *file_pos = NULL; | |
455 | const struct ctf_packet_index_file_hdr *header = NULL; | |
441fa755 | 456 | ctf_fs_ds_index::UP index; |
c05e1405 SM |
457 | ctf_fs_ds_index_entry::UP index_entry; |
458 | ctf_fs_ds_index_entry *prev_index_entry = NULL; | |
ef7d7ac2 | 459 | auto totalPacketsSize = bt2c::DataLen::fromBytes(0); |
4164020e SM |
460 | size_t file_index_entry_size; |
461 | size_t file_entry_count; | |
462 | size_t i; | |
463 | struct ctf_stream_class *sc; | |
464 | struct ctf_msg_iter_packet_properties props; | |
465 | uint32_t version_major, version_minor; | |
4164020e | 466 | |
0f5c5d5c | 467 | BT_CPPLOGI_SPEC(ds_file->logger, "Building index from .idx file of stream file {}", |
a39d9817 | 468 | ds_file->file->path); |
4164020e SM |
469 | ret = ctf_msg_iter_get_packet_properties(msg_iter, &props); |
470 | if (ret) { | |
0f5c5d5c SM |
471 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
472 | "Cannot read first packet's header and context fields."); | |
4164020e SM |
473 | goto error; |
474 | } | |
475 | ||
476 | sc = ctf_trace_class_borrow_stream_class_by_id(ds_file->metadata->tc, props.stream_class_id); | |
477 | BT_ASSERT(sc); | |
478 | if (!sc->default_clock_class) { | |
0f5c5d5c | 479 | BT_CPPLOGI_STR_SPEC(ds_file->logger, "Cannot find stream class's default clock class."); |
4164020e SM |
480 | goto error; |
481 | } | |
482 | ||
483 | /* Look for index file in relative path index/name.idx. */ | |
a39d9817 | 484 | basename = g_path_get_basename(ds_file->file->path.c_str()); |
4164020e | 485 | if (!basename) { |
0f5c5d5c | 486 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot get the basename of datastream file {}", |
a39d9817 | 487 | ds_file->file->path); |
4164020e SM |
488 | goto error; |
489 | } | |
490 | ||
a39d9817 | 491 | directory = g_path_get_dirname(ds_file->file->path.c_str()); |
4164020e | 492 | if (!directory) { |
0f5c5d5c | 493 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot get dirname of datastream file {}", |
a39d9817 | 494 | ds_file->file->path); |
4164020e SM |
495 | goto error; |
496 | } | |
497 | ||
498 | index_basename = g_string_new(basename); | |
499 | if (!index_basename) { | |
0f5c5d5c | 500 | BT_CPPLOGE_STR_SPEC(ds_file->logger, "Cannot allocate index file basename string"); |
4164020e SM |
501 | goto error; |
502 | } | |
503 | ||
504 | g_string_append(index_basename, ".idx"); | |
505 | index_file_path = g_build_filename(directory, "index", index_basename->str, NULL); | |
506 | mapped_file = g_mapped_file_new(index_file_path, FALSE, NULL); | |
507 | if (!mapped_file) { | |
0f5c5d5c | 508 | BT_CPPLOGD_SPEC(ds_file->logger, "Cannot create new mapped file {}", index_file_path); |
4164020e SM |
509 | goto error; |
510 | } | |
511 | ||
512 | /* | |
513 | * The g_mapped_file API limits us to 4GB files on 32-bit. | |
514 | * Traces with such large indexes have never been seen in the wild, | |
515 | * but this would need to be adjusted to support them. | |
516 | */ | |
517 | filesize = g_mapped_file_get_length(mapped_file); | |
518 | if (filesize < sizeof(*header)) { | |
0f5c5d5c SM |
519 | BT_CPPLOGW_SPEC(ds_file->logger, |
520 | "Invalid LTTng trace index file: " | |
521 | "file size ({} bytes) < header size ({} bytes)", | |
522 | filesize, sizeof(*header)); | |
4164020e SM |
523 | goto error; |
524 | } | |
525 | ||
526 | mmap_begin = g_mapped_file_get_contents(mapped_file); | |
527 | header = (struct ctf_packet_index_file_hdr *) mmap_begin; | |
528 | ||
529 | file_pos = g_mapped_file_get_contents(mapped_file) + sizeof(*header); | |
530 | if (be32toh(header->magic) != CTF_INDEX_MAGIC) { | |
0f5c5d5c SM |
531 | BT_CPPLOGW_STR_SPEC(ds_file->logger, |
532 | "Invalid LTTng trace index: \"magic\" field validation failed"); | |
4164020e SM |
533 | goto error; |
534 | } | |
535 | ||
536 | version_major = be32toh(header->index_major); | |
537 | version_minor = be32toh(header->index_minor); | |
538 | if (version_major != 1) { | |
0f5c5d5c SM |
539 | BT_CPPLOGW_SPEC(ds_file->logger, "Unknown LTTng trace index version: major={}, minor={}", |
540 | version_major, version_minor); | |
4164020e SM |
541 | goto error; |
542 | } | |
543 | ||
544 | file_index_entry_size = be32toh(header->packet_index_len); | |
545 | if (file_index_entry_size < CTF_INDEX_1_0_SIZE) { | |
0f5c5d5c SM |
546 | BT_CPPLOGW_SPEC( |
547 | ds_file->logger, | |
4164020e | 548 | "Invalid `packet_index_len` in LTTng trace index file (`packet_index_len` < CTF index 1.0 index entry size): " |
0f5c5d5c | 549 | "packet_index_len={}, CTF_INDEX_1_0_SIZE={}", |
4164020e SM |
550 | file_index_entry_size, CTF_INDEX_1_0_SIZE); |
551 | goto error; | |
552 | } | |
553 | ||
554 | file_entry_count = (filesize - sizeof(*header)) / file_index_entry_size; | |
555 | if ((filesize - sizeof(*header)) % file_index_entry_size) { | |
0f5c5d5c SM |
556 | BT_CPPLOGW_SPEC(ds_file->logger, |
557 | "Invalid LTTng trace index: the index's size after the header " | |
558 | "({} bytes) is not a multiple of the index entry size " | |
559 | "({} bytes)", | |
560 | (filesize - sizeof(*header)), sizeof(*header)); | |
4164020e SM |
561 | goto error; |
562 | } | |
563 | ||
19d9bb23 | 564 | index = bt2s::make_unique<ctf_fs_ds_index>(); |
4164020e SM |
565 | |
566 | for (i = 0; i < file_entry_count; i++) { | |
567 | struct ctf_packet_index *file_index = (struct ctf_packet_index *) file_pos; | |
ef7d7ac2 | 568 | const auto packetSize = bt2c::DataLen::fromBits(be64toh(file_index->packet_size)); |
4164020e | 569 | |
ef7d7ac2 | 570 | if (packetSize.hasExtraBits()) { |
0f5c5d5c SM |
571 | BT_CPPLOGW_SPEC(ds_file->logger, |
572 | "Invalid packet size encountered in LTTng trace index file"); | |
4164020e SM |
573 | goto error; |
574 | } | |
575 | ||
ef7d7ac2 SM |
576 | const auto offset = bt2c::DataLen::fromBytes(be64toh(file_index->offset)); |
577 | ||
578 | if (i != 0 && offset < prev_index_entry->offset) { | |
579 | BT_CPPLOGW_SPEC( | |
580 | ds_file->logger, | |
581 | "Invalid, non-monotonic, packet offset encountered in LTTng trace index file: " | |
582 | "previous offset={} bytes, current offset={} bytes", | |
583 | prev_index_entry->offset.bytes(), offset.bytes()); | |
584 | goto error; | |
585 | } | |
586 | ||
587 | index_entry = ctf_fs_ds_index_entry_create(offset, packetSize); | |
4164020e | 588 | if (!index_entry) { |
0f5c5d5c SM |
589 | BT_CPPLOGE_APPEND_CAUSE_SPEC(ds_file->logger, |
590 | "Failed to create a ctf_fs_ds_index_entry."); | |
4164020e SM |
591 | goto error; |
592 | } | |
593 | ||
594 | /* Set path to stream file. */ | |
4d199954 | 595 | index_entry->path = file_info->path.c_str(); |
4164020e | 596 | |
4164020e SM |
597 | index_entry->timestamp_begin = be64toh(file_index->timestamp_begin); |
598 | index_entry->timestamp_end = be64toh(file_index->timestamp_end); | |
599 | if (index_entry->timestamp_end < index_entry->timestamp_begin) { | |
0f5c5d5c SM |
600 | BT_CPPLOGW_SPEC( |
601 | ds_file->logger, | |
4164020e | 602 | "Invalid packet time bounds encountered in LTTng trace index file (begin > end): " |
0f5c5d5c | 603 | "timestamp_begin={}, timestamp_end={}", |
4164020e SM |
604 | index_entry->timestamp_begin, index_entry->timestamp_end); |
605 | goto error; | |
606 | } | |
607 | ||
608 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
609 | ret = convert_cycles_to_ns(sc->default_clock_class, index_entry->timestamp_begin, | |
610 | &index_entry->timestamp_begin_ns); | |
611 | if (ret) { | |
0f5c5d5c SM |
612 | BT_CPPLOGI_STR_SPEC( |
613 | ds_file->logger, | |
4164020e SM |
614 | "Failed to convert raw timestamp to nanoseconds since Epoch during index parsing"); |
615 | goto error; | |
616 | } | |
617 | ret = convert_cycles_to_ns(sc->default_clock_class, index_entry->timestamp_end, | |
618 | &index_entry->timestamp_end_ns); | |
619 | if (ret) { | |
0f5c5d5c SM |
620 | BT_CPPLOGI_STR_SPEC( |
621 | ds_file->logger, | |
4164020e SM |
622 | "Failed to convert raw timestamp to nanoseconds since Epoch during LTTng trace index parsing"); |
623 | goto error; | |
624 | } | |
625 | ||
626 | if (version_minor >= 1) { | |
627 | index_entry->packet_seq_num = be64toh(file_index->packet_seq_num); | |
628 | } | |
629 | ||
ef7d7ac2 | 630 | totalPacketsSize += packetSize; |
4164020e SM |
631 | file_pos += file_index_entry_size; |
632 | ||
c05e1405 | 633 | prev_index_entry = index_entry.get(); |
4164020e | 634 | |
2fb7af12 | 635 | index->entries.emplace_back(std::move(index_entry)); |
4164020e SM |
636 | } |
637 | ||
638 | /* Validate that the index addresses the complete stream. */ | |
ef7d7ac2 | 639 | if (ds_file->file->size != totalPacketsSize.bytes()) { |
0f5c5d5c SM |
640 | BT_CPPLOGW_SPEC(ds_file->logger, |
641 | "Invalid LTTng trace index file; indexed size != stream file size: " | |
ef7d7ac2 SM |
642 | "file-size={} bytes, total-packets-size={} bytes", |
643 | ds_file->file->size, totalPacketsSize.bytes()); | |
4164020e SM |
644 | goto error; |
645 | } | |
b6c3dcb2 | 646 | end: |
4164020e SM |
647 | g_free(directory); |
648 | g_free(basename); | |
649 | g_free(index_file_path); | |
650 | if (index_basename) { | |
651 | g_string_free(index_basename, TRUE); | |
652 | } | |
653 | if (mapped_file) { | |
654 | g_mapped_file_unref(mapped_file); | |
655 | } | |
656 | return index; | |
97ade20b | 657 | error: |
441fa755 | 658 | index.reset(); |
4164020e | 659 | goto end; |
b6c3dcb2 JG |
660 | } |
661 | ||
4164020e | 662 | static int init_index_entry(struct ctf_fs_ds_index_entry *entry, struct ctf_fs_ds_file *ds_file, |
ef7d7ac2 | 663 | struct ctf_msg_iter_packet_properties *props) |
9e0c8dbb | 664 | { |
4164020e SM |
665 | int ret = 0; |
666 | struct ctf_stream_class *sc; | |
4164020e SM |
667 | |
668 | sc = ctf_trace_class_borrow_stream_class_by_id(ds_file->metadata->tc, props->stream_class_id); | |
669 | BT_ASSERT(sc); | |
4164020e SM |
670 | |
671 | if (props->snapshots.beginning_clock != UINT64_C(-1)) { | |
672 | entry->timestamp_begin = props->snapshots.beginning_clock; | |
673 | ||
674 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
675 | ret = convert_cycles_to_ns(sc->default_clock_class, props->snapshots.beginning_clock, | |
676 | &entry->timestamp_begin_ns); | |
677 | if (ret) { | |
0f5c5d5c SM |
678 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
679 | "Failed to convert raw timestamp to nanoseconds since Epoch."); | |
4164020e SM |
680 | goto end; |
681 | } | |
682 | } else { | |
683 | entry->timestamp_begin = UINT64_C(-1); | |
684 | entry->timestamp_begin_ns = UINT64_C(-1); | |
685 | } | |
686 | ||
687 | if (props->snapshots.end_clock != UINT64_C(-1)) { | |
688 | entry->timestamp_end = props->snapshots.end_clock; | |
689 | ||
690 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
691 | ret = convert_cycles_to_ns(sc->default_clock_class, props->snapshots.end_clock, | |
692 | &entry->timestamp_end_ns); | |
693 | if (ret) { | |
0f5c5d5c SM |
694 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
695 | "Failed to convert raw timestamp to nanoseconds since Epoch."); | |
4164020e SM |
696 | goto end; |
697 | } | |
698 | } else { | |
699 | entry->timestamp_end = UINT64_C(-1); | |
700 | entry->timestamp_end_ns = UINT64_C(-1); | |
701 | } | |
0b29603d | 702 | |
9e0c8dbb | 703 | end: |
4164020e | 704 | return ret; |
9e0c8dbb JG |
705 | } |
706 | ||
441fa755 SM |
707 | static ctf_fs_ds_index::UP build_index_from_stream_file(struct ctf_fs_ds_file *ds_file, |
708 | struct ctf_fs_ds_file_info *file_info, | |
709 | struct ctf_msg_iter *msg_iter) | |
9e0c8dbb | 710 | { |
4164020e | 711 | int ret; |
4164020e | 712 | enum ctf_msg_iter_status iter_status = CTF_MSG_ITER_STATUS_OK; |
ef7d7ac2 | 713 | auto currentPacketOffset = bt2c::DataLen::fromBytes(0); |
4164020e | 714 | |
a39d9817 | 715 | BT_CPPLOGI_SPEC(ds_file->logger, "Indexing stream file {}", ds_file->file->path); |
4164020e | 716 | |
19d9bb23 | 717 | ctf_fs_ds_index::UP index = bt2s::make_unique<ctf_fs_ds_index>(); |
4164020e SM |
718 | |
719 | while (true) { | |
4164020e SM |
720 | struct ctf_msg_iter_packet_properties props; |
721 | ||
ef7d7ac2 | 722 | if (currentPacketOffset.bytes() > ds_file->file->size) { |
0f5c5d5c SM |
723 | BT_CPPLOGE_STR_SPEC(ds_file->logger, |
724 | "Unexpected current packet's offset (larger than file)."); | |
4164020e | 725 | goto error; |
ef7d7ac2 | 726 | } else if (currentPacketOffset.bytes() == ds_file->file->size) { |
4164020e SM |
727 | /* No more data */ |
728 | break; | |
729 | } | |
730 | ||
ef7d7ac2 | 731 | iter_status = ctf_msg_iter_seek(msg_iter, currentPacketOffset.bytes()); |
4164020e SM |
732 | if (iter_status != CTF_MSG_ITER_STATUS_OK) { |
733 | goto error; | |
734 | } | |
735 | ||
736 | iter_status = ctf_msg_iter_get_packet_properties(msg_iter, &props); | |
737 | if (iter_status != CTF_MSG_ITER_STATUS_OK) { | |
738 | goto error; | |
739 | } | |
740 | ||
ef7d7ac2 SM |
741 | /* |
742 | * Get the current packet size from the packet header, if set. Else, | |
743 | * assume there is a single packet in the file, so take the file size | |
744 | * as the packet size. | |
745 | */ | |
746 | const auto currentPacketSize = props.exp_packet_total_size >= 0 ? | |
747 | bt2c::DataLen::fromBits(props.exp_packet_total_size) : | |
748 | bt2c::DataLen::fromBytes(ds_file->file->size); | |
4164020e | 749 | |
ef7d7ac2 | 750 | if ((currentPacketOffset + currentPacketSize).bytes() > ds_file->file->size) { |
0f5c5d5c SM |
751 | BT_CPPLOGW_SPEC(ds_file->logger, |
752 | "Invalid packet size reported in file: stream=\"{}\", " | |
ef7d7ac2 SM |
753 | "packet-offset-bytes={}, packet-size-bytes={}, " |
754 | "file-size-bytes={}", | |
a39d9817 | 755 | ds_file->file->path, currentPacketOffset.bytes(), |
ef7d7ac2 | 756 | currentPacketSize.bytes(), ds_file->file->size); |
4164020e SM |
757 | goto error; |
758 | } | |
759 | ||
c05e1405 | 760 | auto index_entry = ctf_fs_ds_index_entry_create(currentPacketOffset, currentPacketSize); |
4164020e | 761 | if (!index_entry) { |
0f5c5d5c SM |
762 | BT_CPPLOGE_APPEND_CAUSE_SPEC(ds_file->logger, |
763 | "Failed to create a ctf_fs_ds_index_entry."); | |
4164020e SM |
764 | goto error; |
765 | } | |
766 | ||
767 | /* Set path to stream file. */ | |
4d199954 | 768 | index_entry->path = file_info->path.c_str(); |
4164020e | 769 | |
c05e1405 | 770 | ret = init_index_entry(index_entry.get(), ds_file, &props); |
4164020e | 771 | if (ret) { |
4164020e SM |
772 | goto error; |
773 | } | |
774 | ||
2fb7af12 | 775 | index->entries.emplace_back(std::move(index_entry)); |
4164020e | 776 | |
ef7d7ac2 | 777 | currentPacketOffset += currentPacketSize; |
0f5c5d5c | 778 | BT_CPPLOGD_SPEC(ds_file->logger, |
ef7d7ac2 SM |
779 | "Seeking to next packet: current-packet-offset-bytes={}, " |
780 | "next-packet-offset-bytes={}", | |
781 | (currentPacketOffset - currentPacketSize).bytes(), | |
782 | currentPacketOffset.bytes()); | |
4164020e | 783 | } |
312c056a | 784 | |
9e0c8dbb | 785 | end: |
4164020e | 786 | return index; |
312c056a | 787 | |
9e0c8dbb | 788 | error: |
441fa755 | 789 | index.reset(); |
4164020e | 790 | goto end; |
9e0c8dbb JG |
791 | } |
792 | ||
89f88383 SM |
793 | ctf_fs_ds_file::UP ctf_fs_ds_file_create(struct ctf_fs_trace *ctf_fs_trace, |
794 | bt2::Stream::Shared stream, const char *path, | |
795 | const bt2c::Logger& parentLogger) | |
e98a2d6e | 796 | { |
4164020e | 797 | int ret; |
89f88383 | 798 | auto ds_file = bt2s::make_unique<ctf_fs_ds_file>(parentLogger); |
0f5c5d5c | 799 | size_t offset_align; |
4164020e | 800 | |
4726b1ee | 801 | ds_file->file = bt2s::make_unique<ctf_fs_file>(parentLogger); |
265d4ba2 | 802 | ds_file->stream = std::move(stream); |
2dba3a29 | 803 | ds_file->metadata = ctf_fs_trace->metadata.get(); |
a39d9817 | 804 | ds_file->file->path = path; |
c44dc433 | 805 | ret = ctf_fs_file_open(ds_file->file.get(), "rb"); |
4164020e SM |
806 | if (ret) { |
807 | goto error; | |
808 | } | |
809 | ||
0f5c5d5c | 810 | offset_align = bt_mmap_get_offset_align_size(static_cast<int>(ds_file->logger.level())); |
4164020e SM |
811 | ds_file->mmap_max_len = offset_align * 2048; |
812 | ||
813 | goto end; | |
1a9f7075 | 814 | |
e98a2d6e | 815 | error: |
4164020e | 816 | /* Do not touch "borrowed" file. */ |
89f88383 | 817 | ds_file.reset(); |
1a9f7075 | 818 | |
e98a2d6e | 819 | end: |
4164020e | 820 | return ds_file; |
e98a2d6e PP |
821 | } |
822 | ||
441fa755 SM |
823 | ctf_fs_ds_index::UP ctf_fs_ds_file_build_index(struct ctf_fs_ds_file *ds_file, |
824 | struct ctf_fs_ds_file_info *file_info, | |
825 | struct ctf_msg_iter *msg_iter) | |
97ade20b | 826 | { |
441fa755 | 827 | auto index = build_index_from_idx_file(ds_file, file_info, msg_iter); |
4164020e SM |
828 | if (index) { |
829 | goto end; | |
830 | } | |
831 | ||
0f5c5d5c SM |
832 | BT_CPPLOGI_SPEC(ds_file->logger, "Failed to build index from .index file; " |
833 | "falling back to stream indexing."); | |
4164020e | 834 | index = build_index_from_stream_file(ds_file, file_info, msg_iter); |
9e0c8dbb | 835 | end: |
4164020e | 836 | return index; |
97ade20b JG |
837 | } |
838 | ||
3199f1ba | 839 | ctf_fs_ds_file::~ctf_fs_ds_file() |
e98a2d6e | 840 | { |
3199f1ba | 841 | (void) ds_file_munmap(this); |
e98a2d6e | 842 | } |
4f1f88a6 | 843 | |
2cef6403 | 844 | ctf_fs_ds_file_info::UP ctf_fs_ds_file_info_create(const char *path, int64_t begin_ns) |
873c329a | 845 | { |
2cef6403 | 846 | ctf_fs_ds_file_info::UP ds_file_info = bt2s::make_unique<ctf_fs_ds_file_info>(); |
873c329a | 847 | |
4d199954 | 848 | ds_file_info->path = path; |
873c329a | 849 | ds_file_info->begin_ns = begin_ns; |
873c329a SM |
850 | return ds_file_info; |
851 | } | |
852 | ||
fe2e19c4 SM |
853 | ctf_fs_ds_file_group::UP ctf_fs_ds_file_group_create(struct ctf_fs_trace *ctf_fs_trace, |
854 | struct ctf_stream_class *sc, | |
855 | uint64_t stream_instance_id, | |
fe2f9cda | 856 | ctf_fs_ds_index::UP index) |
fe2e19c4 SM |
857 | { |
858 | ctf_fs_ds_file_group::UP ds_file_group {new ctf_fs_ds_file_group}; | |
859 | ||
fe2f9cda | 860 | ds_file_group->index = std::move(index); |
873c329a SM |
861 | |
862 | ds_file_group->stream_id = stream_instance_id; | |
863 | BT_ASSERT(sc); | |
864 | ds_file_group->sc = sc; | |
865 | ds_file_group->ctf_fs_trace = ctf_fs_trace; | |
873c329a | 866 | |
873c329a SM |
867 | return ds_file_group; |
868 | } |