Commit | Line | Data |
---|---|---|
e98a2d6e | 1 | /* |
0235b0db | 2 | * SPDX-License-Identifier: MIT |
e98a2d6e | 3 | * |
0235b0db MJ |
4 | * Copyright 2016-2017 Philippe Proulx <pproulx@efficios.com> |
5 | * Copyright 2016 Jérémie Galarneau <jeremie.galarneau@efficios.com> | |
6 | * Copyright 2010-2011 EfficiOS Inc. and Linux Foundation | |
e98a2d6e PP |
7 | */ |
8 | ||
c802cacb | 9 | #include <glib.h> |
c802cacb SM |
10 | #include <stdint.h> |
11 | #include <stdio.h> | |
c802cacb | 12 | |
83ad336c | 13 | #include "compat/endian.h" /* IWYU pragma: keep */ |
0f5c5d5c | 14 | #include "compat/mman.h" /* IWYU pragma: keep */ |
2cef6403 | 15 | #include "cpp-common/bt2s/make-unique.hpp" |
0f5c5d5c | 16 | #include "cpp-common/vendor/fmt/format.h" |
c802cacb | 17 | |
5656cea5 | 18 | #include "../common/src/msg-iter/msg-iter.hpp" |
087cd0f5 | 19 | #include "data-stream-file.hpp" |
c802cacb | 20 | #include "file.hpp" |
c7e1be4b SM |
21 | #include "fs.hpp" |
22 | #include "lttng-index.hpp" | |
e98a2d6e | 23 | |
4164020e | 24 | static inline size_t remaining_mmap_bytes(struct ctf_fs_ds_file *ds_file) |
e98a2d6e | 25 | { |
4164020e SM |
26 | BT_ASSERT_DBG(ds_file->mmap_len >= ds_file->request_offset_in_mapping); |
27 | return ds_file->mmap_len - ds_file->request_offset_in_mapping; | |
e98a2d6e PP |
28 | } |
29 | ||
127e2341 SM |
30 | /* |
31 | * Return true if `offset_in_file` is in the current mapping. | |
32 | */ | |
33 | ||
4164020e | 34 | static bool offset_ist_mapped(struct ctf_fs_ds_file *ds_file, off_t offset_in_file) |
127e2341 | 35 | { |
4164020e SM |
36 | return offset_in_file >= ds_file->mmap_offset_in_file && |
37 | offset_in_file < (ds_file->mmap_offset_in_file + ds_file->mmap_len); | |
127e2341 SM |
38 | } |
39 | ||
4164020e | 40 | static enum ctf_msg_iter_medium_status ds_file_munmap(struct ctf_fs_ds_file *ds_file) |
e98a2d6e | 41 | { |
4164020e | 42 | enum ctf_msg_iter_medium_status status; |
4164020e SM |
43 | |
44 | BT_ASSERT(ds_file); | |
45 | ||
46 | if (!ds_file->mmap_addr) { | |
47 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
48 | goto end; | |
49 | } | |
50 | ||
51 | if (bt_munmap(ds_file->mmap_addr, ds_file->mmap_len)) { | |
0f5c5d5c SM |
52 | BT_CPPLOGE_ERRNO_SPEC(ds_file->logger, "Cannot memory-unmap file", |
53 | ": address={}, size={}, file_path=\"{}\", file={}", | |
54 | fmt::ptr(ds_file->mmap_addr), ds_file->mmap_len, | |
a39d9817 | 55 | ds_file->file ? ds_file->file->path : "NULL", |
0f5c5d5c | 56 | ds_file->file ? fmt::ptr(ds_file->file->fp) : NULL); |
4164020e SM |
57 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
58 | goto end; | |
59 | } | |
60 | ||
61 | ds_file->mmap_addr = NULL; | |
62 | ||
63 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
fc9a526c | 64 | end: |
4164020e | 65 | return status; |
e98a2d6e PP |
66 | } |
67 | ||
127e2341 SM |
68 | /* |
69 | * mmap a region of `ds_file` such that `requested_offset_in_file` is in the | |
70 | * mapping. If the currently mmap-ed region already contains | |
71 | * `requested_offset_in_file`, the mapping is kept. | |
72 | * | |
f6e68e70 SM |
73 | * Set `ds_file->requested_offset_in_mapping` based on `request_offset_in_file`, |
74 | * such that the next call to `request_bytes` will return bytes starting at that | |
75 | * position. | |
127e2341 SM |
76 | * |
77 | * `requested_offset_in_file` must be a valid offset in the file. | |
78 | */ | |
4164020e SM |
79 | static enum ctf_msg_iter_medium_status ds_file_mmap(struct ctf_fs_ds_file *ds_file, |
80 | off_t requested_offset_in_file) | |
e98a2d6e | 81 | { |
4164020e | 82 | enum ctf_msg_iter_medium_status status; |
4164020e SM |
83 | |
84 | /* Ensure the requested offset is in the file range. */ | |
85 | BT_ASSERT(requested_offset_in_file >= 0); | |
86 | BT_ASSERT(requested_offset_in_file < ds_file->file->size); | |
87 | ||
88 | /* | |
89 | * If the mapping already contains the requested offset, just adjust | |
90 | * requested_offset_in_mapping. | |
91 | */ | |
92 | if (offset_ist_mapped(ds_file, requested_offset_in_file)) { | |
93 | ds_file->request_offset_in_mapping = | |
94 | requested_offset_in_file - ds_file->mmap_offset_in_file; | |
95 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
96 | goto end; | |
97 | } | |
98 | ||
99 | /* Unmap old region */ | |
100 | status = ds_file_munmap(ds_file); | |
101 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { | |
102 | goto end; | |
103 | } | |
104 | ||
105 | /* | |
106 | * Compute a mapping that has the required alignment properties and | |
107 | * contains `requested_offset_in_file`. | |
108 | */ | |
109 | ds_file->request_offset_in_mapping = | |
0f5c5d5c SM |
110 | requested_offset_in_file % |
111 | bt_mmap_get_offset_align_size(static_cast<int>(ds_file->logger.level())); | |
4164020e SM |
112 | ds_file->mmap_offset_in_file = requested_offset_in_file - ds_file->request_offset_in_mapping; |
113 | ds_file->mmap_len = | |
114 | MIN(ds_file->file->size - ds_file->mmap_offset_in_file, ds_file->mmap_max_len); | |
115 | ||
116 | BT_ASSERT(ds_file->mmap_len > 0); | |
117 | ||
118 | ds_file->mmap_addr = | |
85a25425 | 119 | bt_mmap(ds_file->mmap_len, PROT_READ, MAP_PRIVATE, fileno(ds_file->file->fp.get()), |
0f5c5d5c | 120 | ds_file->mmap_offset_in_file, static_cast<int>(ds_file->logger.level())); |
4164020e | 121 | if (ds_file->mmap_addr == MAP_FAILED) { |
0f5c5d5c SM |
122 | BT_CPPLOGE_SPEC(ds_file->logger, |
123 | "Cannot memory-map address (size {}) of file \"{}\" ({}) at offset {}: {}", | |
a39d9817 | 124 | ds_file->mmap_len, ds_file->file->path, fmt::ptr(ds_file->file->fp), |
0f5c5d5c | 125 | (intmax_t) ds_file->mmap_offset_in_file, strerror(errno)); |
4164020e SM |
126 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
127 | goto end; | |
128 | } | |
129 | ||
130 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
127e2341 SM |
131 | |
132 | end: | |
4164020e | 133 | return status; |
127e2341 SM |
134 | } |
135 | ||
136 | /* | |
137 | * Change the mapping of the file to read the region that follows the current | |
138 | * mapping. | |
139 | * | |
140 | * If the file hasn't been mapped yet, then everything (mmap_offset_in_file, | |
141 | * mmap_len, request_offset_in_mapping) should have the value 0, which will | |
142 | * result in the beginning of the file getting mapped. | |
143 | * | |
144 | * return _EOF if the current mapping is the end of the file. | |
145 | */ | |
146 | ||
4164020e | 147 | static enum ctf_msg_iter_medium_status ds_file_mmap_next(struct ctf_fs_ds_file *ds_file) |
127e2341 | 148 | { |
4164020e SM |
149 | enum ctf_msg_iter_medium_status status; |
150 | ||
151 | /* | |
152 | * If we're called, it's because more bytes are requested but we have | |
153 | * given all the bytes of the current mapping. | |
154 | */ | |
155 | BT_ASSERT(ds_file->request_offset_in_mapping == ds_file->mmap_len); | |
156 | ||
157 | /* | |
158 | * If the current mapping coincides with the end of the file, there is | |
159 | * no next mapping. | |
160 | */ | |
161 | if (ds_file->mmap_offset_in_file + ds_file->mmap_len == ds_file->file->size) { | |
162 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; | |
163 | goto end; | |
164 | } | |
165 | ||
166 | status = ds_file_mmap(ds_file, ds_file->mmap_offset_in_file + ds_file->mmap_len); | |
127e2341 | 167 | |
e98a2d6e | 168 | end: |
4164020e | 169 | return status; |
e98a2d6e PP |
170 | } |
171 | ||
4164020e SM |
172 | static enum ctf_msg_iter_medium_status medop_request_bytes(size_t request_sz, uint8_t **buffer_addr, |
173 | size_t *buffer_sz, void *data) | |
e98a2d6e | 174 | { |
4164020e SM |
175 | enum ctf_msg_iter_medium_status status = CTF_MSG_ITER_MEDIUM_STATUS_OK; |
176 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; | |
4164020e SM |
177 | |
178 | BT_ASSERT(request_sz > 0); | |
179 | ||
180 | /* | |
181 | * Check if we have at least one memory-mapped byte left. If we don't, | |
182 | * mmap the next file. | |
183 | */ | |
184 | if (remaining_mmap_bytes(ds_file) == 0) { | |
185 | /* Are we at the end of the file? */ | |
186 | if (ds_file->mmap_offset_in_file >= ds_file->file->size) { | |
a39d9817 SM |
187 | BT_CPPLOGD_SPEC(ds_file->logger, "Reached end of file \"{}\" ({})", ds_file->file->path, |
188 | fmt::ptr(ds_file->file->fp)); | |
4164020e SM |
189 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; |
190 | goto end; | |
191 | } | |
192 | ||
193 | status = ds_file_mmap_next(ds_file); | |
194 | switch (status) { | |
195 | case CTF_MSG_ITER_MEDIUM_STATUS_OK: | |
196 | break; | |
197 | case CTF_MSG_ITER_MEDIUM_STATUS_EOF: | |
198 | goto end; | |
199 | default: | |
0f5c5d5c | 200 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot memory-map next region of file \"{}\" ({})", |
a39d9817 | 201 | ds_file->file->path, fmt::ptr(ds_file->file->fp)); |
4164020e SM |
202 | goto error; |
203 | } | |
204 | } | |
205 | ||
206 | BT_ASSERT(remaining_mmap_bytes(ds_file) > 0); | |
207 | *buffer_sz = MIN(remaining_mmap_bytes(ds_file), request_sz); | |
208 | ||
209 | BT_ASSERT(ds_file->mmap_addr); | |
210 | *buffer_addr = ((uint8_t *) ds_file->mmap_addr) + ds_file->request_offset_in_mapping; | |
211 | ||
212 | ds_file->request_offset_in_mapping += *buffer_sz; | |
213 | goto end; | |
e98a2d6e PP |
214 | |
215 | error: | |
4164020e | 216 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
e98a2d6e PP |
217 | |
218 | end: | |
4164020e | 219 | return status; |
e98a2d6e PP |
220 | } |
221 | ||
ecd7492f | 222 | static bt_stream *medop_borrow_stream(bt_stream_class *stream_class, int64_t, void *data) |
e98a2d6e | 223 | { |
4164020e SM |
224 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; |
225 | bt_stream_class *ds_file_stream_class; | |
226 | bt_stream *stream = NULL; | |
e5be10ef | 227 | |
265d4ba2 | 228 | ds_file_stream_class = ds_file->stream->cls().libObjPtr(); |
94cf822e | 229 | |
4164020e SM |
230 | if (stream_class != ds_file_stream_class) { |
231 | /* | |
232 | * Not supported: two packets described by two different | |
233 | * stream classes within the same data stream file. | |
234 | */ | |
235 | goto end; | |
236 | } | |
e98a2d6e | 237 | |
265d4ba2 | 238 | stream = ds_file->stream->libObjPtr(); |
94cf822e PP |
239 | |
240 | end: | |
4164020e | 241 | return stream; |
e98a2d6e PP |
242 | } |
243 | ||
4164020e | 244 | static enum ctf_msg_iter_medium_status medop_seek(off_t offset, void *data) |
9e0c8dbb | 245 | { |
4164020e | 246 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; |
9e0c8dbb | 247 | |
4164020e SM |
248 | BT_ASSERT(offset >= 0); |
249 | BT_ASSERT(offset < ds_file->file->size); | |
9e0c8dbb | 250 | |
4164020e | 251 | return ds_file_mmap(ds_file, offset); |
9e0c8dbb JG |
252 | } |
253 | ||
18a1979b | 254 | struct ctf_msg_iter_medium_ops ctf_fs_ds_file_medops = { |
4164020e SM |
255 | medop_request_bytes, |
256 | medop_seek, | |
257 | nullptr, | |
258 | medop_borrow_stream, | |
e98a2d6e | 259 | }; |
6de92955 | 260 | |
4164020e SM |
261 | struct ctf_fs_ds_group_medops_data |
262 | { | |
0f5c5d5c SM |
263 | explicit ctf_fs_ds_group_medops_data(const bt2c::Logger& parentLogger) : |
264 | logger {parentLogger, "PLUGIN/SRC.CTF.FS/DS-GROUP-MEDOPS"} | |
265 | { | |
266 | } | |
267 | ||
268 | bt2c::Logger logger; | |
269 | ||
4164020e | 270 | /* Weak, set once at creation time. */ |
afb0f12b | 271 | struct ctf_fs_ds_file_group *ds_file_group = nullptr; |
4164020e SM |
272 | |
273 | /* | |
274 | * Index (as in element rank) of the index entry of ds_file_groups' | |
275 | * index we will read next (so, the one after the one we are reading | |
276 | * right now). | |
277 | */ | |
afb0f12b | 278 | guint next_index_entry_index = 0; |
4164020e SM |
279 | |
280 | /* | |
281 | * File we are currently reading. Changes whenever we switch to | |
282 | * reading another data file. | |
283 | * | |
284 | * Owned by this. | |
285 | */ | |
afb0f12b | 286 | struct ctf_fs_ds_file *file = nullptr; |
4164020e SM |
287 | |
288 | /* Weak, for context / logging / appending causes. */ | |
afb0f12b | 289 | bt_self_message_iterator *self_msg_iter = nullptr; |
f6e68e70 SM |
290 | }; |
291 | ||
4164020e SM |
292 | static enum ctf_msg_iter_medium_status medop_group_request_bytes(size_t request_sz, |
293 | uint8_t **buffer_addr, | |
294 | size_t *buffer_sz, void *void_data) | |
f6e68e70 | 295 | { |
4164020e | 296 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
f6e68e70 | 297 | |
4164020e SM |
298 | /* Return bytes from the current file. */ |
299 | return medop_request_bytes(request_sz, buffer_addr, buffer_sz, data->file); | |
f6e68e70 SM |
300 | } |
301 | ||
4164020e SM |
302 | static bt_stream *medop_group_borrow_stream(bt_stream_class *stream_class, int64_t stream_id, |
303 | void *void_data) | |
f6e68e70 | 304 | { |
4164020e | 305 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
f6e68e70 | 306 | |
4164020e | 307 | return medop_borrow_stream(stream_class, stream_id, data->file); |
f6e68e70 SM |
308 | } |
309 | ||
310 | /* | |
311 | * Set `data->file` to prepare it to read the packet described | |
312 | * by `index_entry`. | |
313 | */ | |
314 | ||
4164020e SM |
315 | static enum ctf_msg_iter_medium_status |
316 | ctf_fs_ds_group_medops_set_file(struct ctf_fs_ds_group_medops_data *data, | |
0f5c5d5c | 317 | struct ctf_fs_ds_index_entry *index_entry) |
f6e68e70 | 318 | { |
4164020e SM |
319 | enum ctf_msg_iter_medium_status status; |
320 | ||
321 | BT_ASSERT(data); | |
322 | BT_ASSERT(index_entry); | |
323 | ||
324 | /* Check if that file is already the one mapped. */ | |
a39d9817 | 325 | if (!data->file || data->file->file->path != index_entry->path) { |
4164020e | 326 | /* Destroy the previously used file. */ |
3199f1ba | 327 | delete data->file; |
4164020e SM |
328 | |
329 | /* Create the new file. */ | |
265d4ba2 SM |
330 | data->file = |
331 | ctf_fs_ds_file_create(data->ds_file_group->ctf_fs_trace, data->ds_file_group->stream, | |
89f88383 SM |
332 | index_entry->path, data->logger) |
333 | .release(); | |
4164020e | 334 | if (!data->file) { |
0f5c5d5c | 335 | BT_CPPLOGE_APPEND_CAUSE_SPEC(data->logger, "failed to create ctf_fs_ds_file."); |
4164020e SM |
336 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
337 | goto end; | |
338 | } | |
339 | } | |
340 | ||
341 | /* | |
342 | * Ensure the right portion of the file will be returned on the next | |
343 | * request_bytes call. | |
344 | */ | |
ef7d7ac2 | 345 | status = ds_file_mmap(data->file, index_entry->offset.bytes()); |
4164020e SM |
346 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { |
347 | goto end; | |
348 | } | |
349 | ||
350 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
f6e68e70 SM |
351 | |
352 | end: | |
4164020e | 353 | return status; |
f6e68e70 SM |
354 | } |
355 | ||
4164020e | 356 | static enum ctf_msg_iter_medium_status medop_group_switch_packet(void *void_data) |
f6e68e70 | 357 | { |
4164020e SM |
358 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
359 | struct ctf_fs_ds_index_entry *index_entry; | |
360 | enum ctf_msg_iter_medium_status status; | |
361 | ||
362 | /* If we have gone through all index entries, we are done. */ | |
2fb7af12 | 363 | if (data->next_index_entry_index >= data->ds_file_group->index->entries.size()) { |
4164020e SM |
364 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; |
365 | goto end; | |
366 | } | |
367 | ||
368 | /* | |
369 | * Otherwise, look up the next index entry / packet and prepare it | |
370 | * for reading. | |
371 | */ | |
2fb7af12 | 372 | index_entry = data->ds_file_group->index->entries[data->next_index_entry_index].get(); |
4164020e | 373 | |
0f5c5d5c | 374 | status = ctf_fs_ds_group_medops_set_file(data, index_entry); |
4164020e SM |
375 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { |
376 | goto end; | |
377 | } | |
378 | ||
379 | data->next_index_entry_index++; | |
380 | ||
381 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
f6e68e70 | 382 | end: |
4164020e | 383 | return status; |
f6e68e70 SM |
384 | } |
385 | ||
4164020e | 386 | void ctf_fs_ds_group_medops_data_destroy(struct ctf_fs_ds_group_medops_data *data) |
f6e68e70 | 387 | { |
4164020e SM |
388 | if (!data) { |
389 | goto end; | |
390 | } | |
f6e68e70 | 391 | |
3199f1ba | 392 | delete data->file; |
f6e68e70 | 393 | |
afb0f12b | 394 | delete data; |
f6e68e70 SM |
395 | |
396 | end: | |
4164020e | 397 | return; |
f6e68e70 SM |
398 | } |
399 | ||
400 | enum ctf_msg_iter_medium_status ctf_fs_ds_group_medops_data_create( | |
4164020e | 401 | struct ctf_fs_ds_file_group *ds_file_group, bt_self_message_iterator *self_msg_iter, |
0f5c5d5c | 402 | const bt2c::Logger& parentLogger, struct ctf_fs_ds_group_medops_data **out) |
f6e68e70 | 403 | { |
4164020e SM |
404 | BT_ASSERT(self_msg_iter); |
405 | BT_ASSERT(ds_file_group); | |
406 | BT_ASSERT(ds_file_group->index); | |
2fb7af12 | 407 | BT_ASSERT(!ds_file_group->index->entries.empty()); |
4164020e | 408 | |
0f5c5d5c | 409 | ctf_fs_ds_group_medops_data *data = new ctf_fs_ds_group_medops_data {parentLogger}; |
4164020e SM |
410 | data->ds_file_group = ds_file_group; |
411 | data->self_msg_iter = self_msg_iter; | |
4164020e SM |
412 | |
413 | /* | |
414 | * No need to prepare the first file. ctf_msg_iter will call | |
415 | * switch_packet before reading the first packet, it will be | |
416 | * done then. | |
417 | */ | |
418 | ||
419 | *out = data; | |
afb0f12b | 420 | return CTF_MSG_ITER_MEDIUM_STATUS_OK; |
f6e68e70 SM |
421 | } |
422 | ||
423 | void ctf_fs_ds_group_medops_data_reset(struct ctf_fs_ds_group_medops_data *data) | |
424 | { | |
4164020e | 425 | data->next_index_entry_index = 0; |
f6e68e70 SM |
426 | } |
427 | ||
428 | struct ctf_msg_iter_medium_ops ctf_fs_ds_group_medops = { | |
4164020e | 429 | .request_bytes = medop_group_request_bytes, |
f6e68e70 | 430 | |
4164020e SM |
431 | /* |
432 | * We don't support seeking using this medops. It would probably be | |
433 | * possible, but it's not needed at the moment. | |
434 | */ | |
435 | .seek = NULL, | |
087cd0f5 | 436 | |
4164020e SM |
437 | .switch_packet = medop_group_switch_packet, |
438 | .borrow_stream = medop_group_borrow_stream, | |
f6e68e70 SM |
439 | }; |
440 | ||
c05e1405 SM |
441 | static ctf_fs_ds_index_entry::UP ctf_fs_ds_index_entry_create(const bt2c::DataLen offset, |
442 | const bt2c::DataLen packetSize) | |
afb0f12b | 443 | { |
c05e1405 | 444 | ctf_fs_ds_index_entry::UP entry = bt2s::make_unique<ctf_fs_ds_index_entry>(offset, packetSize); |
ef7d7ac2 | 445 | |
4164020e | 446 | entry->packet_seq_num = UINT64_MAX; |
6834784d | 447 | |
4164020e | 448 | return entry; |
6834784d SM |
449 | } |
450 | ||
4164020e | 451 | static int convert_cycles_to_ns(struct ctf_clock_class *clock_class, uint64_t cycles, int64_t *ns) |
b6c3dcb2 | 452 | { |
4164020e SM |
453 | return bt_util_clock_cycles_to_ns_from_origin(cycles, clock_class->frequency, |
454 | clock_class->offset_seconds, | |
455 | clock_class->offset_cycles, ns); | |
97ade20b JG |
456 | } |
457 | ||
441fa755 SM |
458 | static ctf_fs_ds_index::UP build_index_from_idx_file(struct ctf_fs_ds_file *ds_file, |
459 | struct ctf_fs_ds_file_info *file_info, | |
460 | struct ctf_msg_iter *msg_iter) | |
97ade20b | 461 | { |
4164020e SM |
462 | int ret; |
463 | gchar *directory = NULL; | |
464 | gchar *basename = NULL; | |
465 | GString *index_basename = NULL; | |
466 | gchar *index_file_path = NULL; | |
467 | GMappedFile *mapped_file = NULL; | |
468 | gsize filesize; | |
469 | const char *mmap_begin = NULL, *file_pos = NULL; | |
470 | const struct ctf_packet_index_file_hdr *header = NULL; | |
441fa755 | 471 | ctf_fs_ds_index::UP index; |
c05e1405 SM |
472 | ctf_fs_ds_index_entry::UP index_entry; |
473 | ctf_fs_ds_index_entry *prev_index_entry = NULL; | |
ef7d7ac2 | 474 | auto totalPacketsSize = bt2c::DataLen::fromBytes(0); |
4164020e SM |
475 | size_t file_index_entry_size; |
476 | size_t file_entry_count; | |
477 | size_t i; | |
478 | struct ctf_stream_class *sc; | |
479 | struct ctf_msg_iter_packet_properties props; | |
480 | uint32_t version_major, version_minor; | |
4164020e | 481 | |
0f5c5d5c | 482 | BT_CPPLOGI_SPEC(ds_file->logger, "Building index from .idx file of stream file {}", |
a39d9817 | 483 | ds_file->file->path); |
4164020e SM |
484 | ret = ctf_msg_iter_get_packet_properties(msg_iter, &props); |
485 | if (ret) { | |
0f5c5d5c SM |
486 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
487 | "Cannot read first packet's header and context fields."); | |
4164020e SM |
488 | goto error; |
489 | } | |
490 | ||
491 | sc = ctf_trace_class_borrow_stream_class_by_id(ds_file->metadata->tc, props.stream_class_id); | |
492 | BT_ASSERT(sc); | |
493 | if (!sc->default_clock_class) { | |
0f5c5d5c | 494 | BT_CPPLOGI_STR_SPEC(ds_file->logger, "Cannot find stream class's default clock class."); |
4164020e SM |
495 | goto error; |
496 | } | |
497 | ||
498 | /* Look for index file in relative path index/name.idx. */ | |
a39d9817 | 499 | basename = g_path_get_basename(ds_file->file->path.c_str()); |
4164020e | 500 | if (!basename) { |
0f5c5d5c | 501 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot get the basename of datastream file {}", |
a39d9817 | 502 | ds_file->file->path); |
4164020e SM |
503 | goto error; |
504 | } | |
505 | ||
a39d9817 | 506 | directory = g_path_get_dirname(ds_file->file->path.c_str()); |
4164020e | 507 | if (!directory) { |
0f5c5d5c | 508 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot get dirname of datastream file {}", |
a39d9817 | 509 | ds_file->file->path); |
4164020e SM |
510 | goto error; |
511 | } | |
512 | ||
513 | index_basename = g_string_new(basename); | |
514 | if (!index_basename) { | |
0f5c5d5c | 515 | BT_CPPLOGE_STR_SPEC(ds_file->logger, "Cannot allocate index file basename string"); |
4164020e SM |
516 | goto error; |
517 | } | |
518 | ||
519 | g_string_append(index_basename, ".idx"); | |
520 | index_file_path = g_build_filename(directory, "index", index_basename->str, NULL); | |
521 | mapped_file = g_mapped_file_new(index_file_path, FALSE, NULL); | |
522 | if (!mapped_file) { | |
0f5c5d5c | 523 | BT_CPPLOGD_SPEC(ds_file->logger, "Cannot create new mapped file {}", index_file_path); |
4164020e SM |
524 | goto error; |
525 | } | |
526 | ||
527 | /* | |
528 | * The g_mapped_file API limits us to 4GB files on 32-bit. | |
529 | * Traces with such large indexes have never been seen in the wild, | |
530 | * but this would need to be adjusted to support them. | |
531 | */ | |
532 | filesize = g_mapped_file_get_length(mapped_file); | |
533 | if (filesize < sizeof(*header)) { | |
0f5c5d5c SM |
534 | BT_CPPLOGW_SPEC(ds_file->logger, |
535 | "Invalid LTTng trace index file: " | |
536 | "file size ({} bytes) < header size ({} bytes)", | |
537 | filesize, sizeof(*header)); | |
4164020e SM |
538 | goto error; |
539 | } | |
540 | ||
541 | mmap_begin = g_mapped_file_get_contents(mapped_file); | |
542 | header = (struct ctf_packet_index_file_hdr *) mmap_begin; | |
543 | ||
544 | file_pos = g_mapped_file_get_contents(mapped_file) + sizeof(*header); | |
545 | if (be32toh(header->magic) != CTF_INDEX_MAGIC) { | |
0f5c5d5c SM |
546 | BT_CPPLOGW_STR_SPEC(ds_file->logger, |
547 | "Invalid LTTng trace index: \"magic\" field validation failed"); | |
4164020e SM |
548 | goto error; |
549 | } | |
550 | ||
551 | version_major = be32toh(header->index_major); | |
552 | version_minor = be32toh(header->index_minor); | |
553 | if (version_major != 1) { | |
0f5c5d5c SM |
554 | BT_CPPLOGW_SPEC(ds_file->logger, "Unknown LTTng trace index version: major={}, minor={}", |
555 | version_major, version_minor); | |
4164020e SM |
556 | goto error; |
557 | } | |
558 | ||
559 | file_index_entry_size = be32toh(header->packet_index_len); | |
560 | if (file_index_entry_size < CTF_INDEX_1_0_SIZE) { | |
0f5c5d5c SM |
561 | BT_CPPLOGW_SPEC( |
562 | ds_file->logger, | |
4164020e | 563 | "Invalid `packet_index_len` in LTTng trace index file (`packet_index_len` < CTF index 1.0 index entry size): " |
0f5c5d5c | 564 | "packet_index_len={}, CTF_INDEX_1_0_SIZE={}", |
4164020e SM |
565 | file_index_entry_size, CTF_INDEX_1_0_SIZE); |
566 | goto error; | |
567 | } | |
568 | ||
569 | file_entry_count = (filesize - sizeof(*header)) / file_index_entry_size; | |
570 | if ((filesize - sizeof(*header)) % file_index_entry_size) { | |
0f5c5d5c SM |
571 | BT_CPPLOGW_SPEC(ds_file->logger, |
572 | "Invalid LTTng trace index: the index's size after the header " | |
573 | "({} bytes) is not a multiple of the index entry size " | |
574 | "({} bytes)", | |
575 | (filesize - sizeof(*header)), sizeof(*header)); | |
4164020e SM |
576 | goto error; |
577 | } | |
578 | ||
2fb7af12 | 579 | index = ctf_fs_ds_index_create(); |
4164020e SM |
580 | if (!index) { |
581 | goto error; | |
582 | } | |
583 | ||
584 | for (i = 0; i < file_entry_count; i++) { | |
585 | struct ctf_packet_index *file_index = (struct ctf_packet_index *) file_pos; | |
ef7d7ac2 | 586 | const auto packetSize = bt2c::DataLen::fromBits(be64toh(file_index->packet_size)); |
4164020e | 587 | |
ef7d7ac2 | 588 | if (packetSize.hasExtraBits()) { |
0f5c5d5c SM |
589 | BT_CPPLOGW_SPEC(ds_file->logger, |
590 | "Invalid packet size encountered in LTTng trace index file"); | |
4164020e SM |
591 | goto error; |
592 | } | |
593 | ||
ef7d7ac2 SM |
594 | const auto offset = bt2c::DataLen::fromBytes(be64toh(file_index->offset)); |
595 | ||
596 | if (i != 0 && offset < prev_index_entry->offset) { | |
597 | BT_CPPLOGW_SPEC( | |
598 | ds_file->logger, | |
599 | "Invalid, non-monotonic, packet offset encountered in LTTng trace index file: " | |
600 | "previous offset={} bytes, current offset={} bytes", | |
601 | prev_index_entry->offset.bytes(), offset.bytes()); | |
602 | goto error; | |
603 | } | |
604 | ||
605 | index_entry = ctf_fs_ds_index_entry_create(offset, packetSize); | |
4164020e | 606 | if (!index_entry) { |
0f5c5d5c SM |
607 | BT_CPPLOGE_APPEND_CAUSE_SPEC(ds_file->logger, |
608 | "Failed to create a ctf_fs_ds_index_entry."); | |
4164020e SM |
609 | goto error; |
610 | } | |
611 | ||
612 | /* Set path to stream file. */ | |
4d199954 | 613 | index_entry->path = file_info->path.c_str(); |
4164020e | 614 | |
4164020e SM |
615 | index_entry->timestamp_begin = be64toh(file_index->timestamp_begin); |
616 | index_entry->timestamp_end = be64toh(file_index->timestamp_end); | |
617 | if (index_entry->timestamp_end < index_entry->timestamp_begin) { | |
0f5c5d5c SM |
618 | BT_CPPLOGW_SPEC( |
619 | ds_file->logger, | |
4164020e | 620 | "Invalid packet time bounds encountered in LTTng trace index file (begin > end): " |
0f5c5d5c | 621 | "timestamp_begin={}, timestamp_end={}", |
4164020e SM |
622 | index_entry->timestamp_begin, index_entry->timestamp_end); |
623 | goto error; | |
624 | } | |
625 | ||
626 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
627 | ret = convert_cycles_to_ns(sc->default_clock_class, index_entry->timestamp_begin, | |
628 | &index_entry->timestamp_begin_ns); | |
629 | if (ret) { | |
0f5c5d5c SM |
630 | BT_CPPLOGI_STR_SPEC( |
631 | ds_file->logger, | |
4164020e SM |
632 | "Failed to convert raw timestamp to nanoseconds since Epoch during index parsing"); |
633 | goto error; | |
634 | } | |
635 | ret = convert_cycles_to_ns(sc->default_clock_class, index_entry->timestamp_end, | |
636 | &index_entry->timestamp_end_ns); | |
637 | if (ret) { | |
0f5c5d5c SM |
638 | BT_CPPLOGI_STR_SPEC( |
639 | ds_file->logger, | |
4164020e SM |
640 | "Failed to convert raw timestamp to nanoseconds since Epoch during LTTng trace index parsing"); |
641 | goto error; | |
642 | } | |
643 | ||
644 | if (version_minor >= 1) { | |
645 | index_entry->packet_seq_num = be64toh(file_index->packet_seq_num); | |
646 | } | |
647 | ||
ef7d7ac2 | 648 | totalPacketsSize += packetSize; |
4164020e SM |
649 | file_pos += file_index_entry_size; |
650 | ||
c05e1405 | 651 | prev_index_entry = index_entry.get(); |
4164020e | 652 | |
2fb7af12 | 653 | index->entries.emplace_back(std::move(index_entry)); |
4164020e SM |
654 | } |
655 | ||
656 | /* Validate that the index addresses the complete stream. */ | |
ef7d7ac2 | 657 | if (ds_file->file->size != totalPacketsSize.bytes()) { |
0f5c5d5c SM |
658 | BT_CPPLOGW_SPEC(ds_file->logger, |
659 | "Invalid LTTng trace index file; indexed size != stream file size: " | |
ef7d7ac2 SM |
660 | "file-size={} bytes, total-packets-size={} bytes", |
661 | ds_file->file->size, totalPacketsSize.bytes()); | |
4164020e SM |
662 | goto error; |
663 | } | |
b6c3dcb2 | 664 | end: |
4164020e SM |
665 | g_free(directory); |
666 | g_free(basename); | |
667 | g_free(index_file_path); | |
668 | if (index_basename) { | |
669 | g_string_free(index_basename, TRUE); | |
670 | } | |
671 | if (mapped_file) { | |
672 | g_mapped_file_unref(mapped_file); | |
673 | } | |
674 | return index; | |
97ade20b | 675 | error: |
441fa755 | 676 | index.reset(); |
4164020e | 677 | goto end; |
b6c3dcb2 JG |
678 | } |
679 | ||
4164020e | 680 | static int init_index_entry(struct ctf_fs_ds_index_entry *entry, struct ctf_fs_ds_file *ds_file, |
ef7d7ac2 | 681 | struct ctf_msg_iter_packet_properties *props) |
9e0c8dbb | 682 | { |
4164020e SM |
683 | int ret = 0; |
684 | struct ctf_stream_class *sc; | |
4164020e SM |
685 | |
686 | sc = ctf_trace_class_borrow_stream_class_by_id(ds_file->metadata->tc, props->stream_class_id); | |
687 | BT_ASSERT(sc); | |
4164020e SM |
688 | |
689 | if (props->snapshots.beginning_clock != UINT64_C(-1)) { | |
690 | entry->timestamp_begin = props->snapshots.beginning_clock; | |
691 | ||
692 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
693 | ret = convert_cycles_to_ns(sc->default_clock_class, props->snapshots.beginning_clock, | |
694 | &entry->timestamp_begin_ns); | |
695 | if (ret) { | |
0f5c5d5c SM |
696 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
697 | "Failed to convert raw timestamp to nanoseconds since Epoch."); | |
4164020e SM |
698 | goto end; |
699 | } | |
700 | } else { | |
701 | entry->timestamp_begin = UINT64_C(-1); | |
702 | entry->timestamp_begin_ns = UINT64_C(-1); | |
703 | } | |
704 | ||
705 | if (props->snapshots.end_clock != UINT64_C(-1)) { | |
706 | entry->timestamp_end = props->snapshots.end_clock; | |
707 | ||
708 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
709 | ret = convert_cycles_to_ns(sc->default_clock_class, props->snapshots.end_clock, | |
710 | &entry->timestamp_end_ns); | |
711 | if (ret) { | |
0f5c5d5c SM |
712 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
713 | "Failed to convert raw timestamp to nanoseconds since Epoch."); | |
4164020e SM |
714 | goto end; |
715 | } | |
716 | } else { | |
717 | entry->timestamp_end = UINT64_C(-1); | |
718 | entry->timestamp_end_ns = UINT64_C(-1); | |
719 | } | |
0b29603d | 720 | |
9e0c8dbb | 721 | end: |
4164020e | 722 | return ret; |
9e0c8dbb JG |
723 | } |
724 | ||
441fa755 SM |
725 | static ctf_fs_ds_index::UP build_index_from_stream_file(struct ctf_fs_ds_file *ds_file, |
726 | struct ctf_fs_ds_file_info *file_info, | |
727 | struct ctf_msg_iter *msg_iter) | |
9e0c8dbb | 728 | { |
4164020e | 729 | int ret; |
441fa755 | 730 | ctf_fs_ds_index::UP index; |
4164020e | 731 | enum ctf_msg_iter_status iter_status = CTF_MSG_ITER_STATUS_OK; |
ef7d7ac2 | 732 | auto currentPacketOffset = bt2c::DataLen::fromBytes(0); |
4164020e | 733 | |
a39d9817 | 734 | BT_CPPLOGI_SPEC(ds_file->logger, "Indexing stream file {}", ds_file->file->path); |
4164020e | 735 | |
2fb7af12 | 736 | index = ctf_fs_ds_index_create(); |
4164020e SM |
737 | if (!index) { |
738 | goto error; | |
739 | } | |
740 | ||
741 | while (true) { | |
4164020e SM |
742 | struct ctf_msg_iter_packet_properties props; |
743 | ||
ef7d7ac2 | 744 | if (currentPacketOffset.bytes() > ds_file->file->size) { |
0f5c5d5c SM |
745 | BT_CPPLOGE_STR_SPEC(ds_file->logger, |
746 | "Unexpected current packet's offset (larger than file)."); | |
4164020e | 747 | goto error; |
ef7d7ac2 | 748 | } else if (currentPacketOffset.bytes() == ds_file->file->size) { |
4164020e SM |
749 | /* No more data */ |
750 | break; | |
751 | } | |
752 | ||
ef7d7ac2 | 753 | iter_status = ctf_msg_iter_seek(msg_iter, currentPacketOffset.bytes()); |
4164020e SM |
754 | if (iter_status != CTF_MSG_ITER_STATUS_OK) { |
755 | goto error; | |
756 | } | |
757 | ||
758 | iter_status = ctf_msg_iter_get_packet_properties(msg_iter, &props); | |
759 | if (iter_status != CTF_MSG_ITER_STATUS_OK) { | |
760 | goto error; | |
761 | } | |
762 | ||
ef7d7ac2 SM |
763 | /* |
764 | * Get the current packet size from the packet header, if set. Else, | |
765 | * assume there is a single packet in the file, so take the file size | |
766 | * as the packet size. | |
767 | */ | |
768 | const auto currentPacketSize = props.exp_packet_total_size >= 0 ? | |
769 | bt2c::DataLen::fromBits(props.exp_packet_total_size) : | |
770 | bt2c::DataLen::fromBytes(ds_file->file->size); | |
4164020e | 771 | |
ef7d7ac2 | 772 | if ((currentPacketOffset + currentPacketSize).bytes() > ds_file->file->size) { |
0f5c5d5c SM |
773 | BT_CPPLOGW_SPEC(ds_file->logger, |
774 | "Invalid packet size reported in file: stream=\"{}\", " | |
ef7d7ac2 SM |
775 | "packet-offset-bytes={}, packet-size-bytes={}, " |
776 | "file-size-bytes={}", | |
a39d9817 | 777 | ds_file->file->path, currentPacketOffset.bytes(), |
ef7d7ac2 | 778 | currentPacketSize.bytes(), ds_file->file->size); |
4164020e SM |
779 | goto error; |
780 | } | |
781 | ||
c05e1405 | 782 | auto index_entry = ctf_fs_ds_index_entry_create(currentPacketOffset, currentPacketSize); |
4164020e | 783 | if (!index_entry) { |
0f5c5d5c SM |
784 | BT_CPPLOGE_APPEND_CAUSE_SPEC(ds_file->logger, |
785 | "Failed to create a ctf_fs_ds_index_entry."); | |
4164020e SM |
786 | goto error; |
787 | } | |
788 | ||
789 | /* Set path to stream file. */ | |
4d199954 | 790 | index_entry->path = file_info->path.c_str(); |
4164020e | 791 | |
c05e1405 | 792 | ret = init_index_entry(index_entry.get(), ds_file, &props); |
4164020e | 793 | if (ret) { |
4164020e SM |
794 | goto error; |
795 | } | |
796 | ||
2fb7af12 | 797 | index->entries.emplace_back(std::move(index_entry)); |
4164020e | 798 | |
ef7d7ac2 | 799 | currentPacketOffset += currentPacketSize; |
0f5c5d5c | 800 | BT_CPPLOGD_SPEC(ds_file->logger, |
ef7d7ac2 SM |
801 | "Seeking to next packet: current-packet-offset-bytes={}, " |
802 | "next-packet-offset-bytes={}", | |
803 | (currentPacketOffset - currentPacketSize).bytes(), | |
804 | currentPacketOffset.bytes()); | |
4164020e | 805 | } |
312c056a | 806 | |
9e0c8dbb | 807 | end: |
4164020e | 808 | return index; |
312c056a | 809 | |
9e0c8dbb | 810 | error: |
441fa755 | 811 | index.reset(); |
4164020e | 812 | goto end; |
9e0c8dbb JG |
813 | } |
814 | ||
89f88383 SM |
815 | ctf_fs_ds_file::UP ctf_fs_ds_file_create(struct ctf_fs_trace *ctf_fs_trace, |
816 | bt2::Stream::Shared stream, const char *path, | |
817 | const bt2c::Logger& parentLogger) | |
e98a2d6e | 818 | { |
4164020e | 819 | int ret; |
89f88383 | 820 | auto ds_file = bt2s::make_unique<ctf_fs_ds_file>(parentLogger); |
0f5c5d5c | 821 | size_t offset_align; |
4164020e | 822 | |
c44dc433 | 823 | ds_file->file = ctf_fs_file_create(parentLogger); |
4164020e SM |
824 | if (!ds_file->file) { |
825 | goto error; | |
826 | } | |
827 | ||
265d4ba2 | 828 | ds_file->stream = std::move(stream); |
4164020e | 829 | ds_file->metadata = ctf_fs_trace->metadata; |
a39d9817 | 830 | ds_file->file->path = path; |
c44dc433 | 831 | ret = ctf_fs_file_open(ds_file->file.get(), "rb"); |
4164020e SM |
832 | if (ret) { |
833 | goto error; | |
834 | } | |
835 | ||
0f5c5d5c | 836 | offset_align = bt_mmap_get_offset_align_size(static_cast<int>(ds_file->logger.level())); |
4164020e SM |
837 | ds_file->mmap_max_len = offset_align * 2048; |
838 | ||
839 | goto end; | |
1a9f7075 | 840 | |
e98a2d6e | 841 | error: |
4164020e | 842 | /* Do not touch "borrowed" file. */ |
89f88383 | 843 | ds_file.reset(); |
1a9f7075 | 844 | |
e98a2d6e | 845 | end: |
4164020e | 846 | return ds_file; |
e98a2d6e PP |
847 | } |
848 | ||
441fa755 SM |
849 | ctf_fs_ds_index::UP ctf_fs_ds_file_build_index(struct ctf_fs_ds_file *ds_file, |
850 | struct ctf_fs_ds_file_info *file_info, | |
851 | struct ctf_msg_iter *msg_iter) | |
97ade20b | 852 | { |
441fa755 | 853 | auto index = build_index_from_idx_file(ds_file, file_info, msg_iter); |
4164020e SM |
854 | if (index) { |
855 | goto end; | |
856 | } | |
857 | ||
0f5c5d5c SM |
858 | BT_CPPLOGI_SPEC(ds_file->logger, "Failed to build index from .index file; " |
859 | "falling back to stream indexing."); | |
4164020e | 860 | index = build_index_from_stream_file(ds_file, file_info, msg_iter); |
9e0c8dbb | 861 | end: |
4164020e | 862 | return index; |
97ade20b JG |
863 | } |
864 | ||
2fb7af12 | 865 | ctf_fs_ds_index::UP ctf_fs_ds_index_create() |
7ed5243a | 866 | { |
bfd852f0 | 867 | return bt2s::make_unique<ctf_fs_ds_index>(); |
7ed5243a FD |
868 | } |
869 | ||
3199f1ba | 870 | ctf_fs_ds_file::~ctf_fs_ds_file() |
e98a2d6e | 871 | { |
3199f1ba | 872 | (void) ds_file_munmap(this); |
e98a2d6e | 873 | } |
4f1f88a6 | 874 | |
2cef6403 | 875 | ctf_fs_ds_file_info::UP ctf_fs_ds_file_info_create(const char *path, int64_t begin_ns) |
873c329a | 876 | { |
2cef6403 | 877 | ctf_fs_ds_file_info::UP ds_file_info = bt2s::make_unique<ctf_fs_ds_file_info>(); |
873c329a | 878 | |
4d199954 | 879 | ds_file_info->path = path; |
873c329a | 880 | ds_file_info->begin_ns = begin_ns; |
873c329a SM |
881 | return ds_file_info; |
882 | } | |
883 | ||
fe2e19c4 SM |
884 | ctf_fs_ds_file_group::UP ctf_fs_ds_file_group_create(struct ctf_fs_trace *ctf_fs_trace, |
885 | struct ctf_stream_class *sc, | |
886 | uint64_t stream_instance_id, | |
fe2f9cda | 887 | ctf_fs_ds_index::UP index) |
fe2e19c4 SM |
888 | { |
889 | ctf_fs_ds_file_group::UP ds_file_group {new ctf_fs_ds_file_group}; | |
890 | ||
fe2f9cda | 891 | ds_file_group->index = std::move(index); |
873c329a SM |
892 | |
893 | ds_file_group->stream_id = stream_instance_id; | |
894 | BT_ASSERT(sc); | |
895 | ds_file_group->sc = sc; | |
896 | ds_file_group->ctf_fs_trace = ctf_fs_trace; | |
873c329a | 897 | |
873c329a SM |
898 | return ds_file_group; |
899 | } |