Commit | Line | Data |
---|---|---|
e98a2d6e | 1 | /* |
0235b0db | 2 | * SPDX-License-Identifier: MIT |
e98a2d6e | 3 | * |
0235b0db MJ |
4 | * Copyright 2016-2017 Philippe Proulx <pproulx@efficios.com> |
5 | * Copyright 2016 Jérémie Galarneau <jeremie.galarneau@efficios.com> | |
6 | * Copyright 2010-2011 EfficiOS Inc. and Linux Foundation | |
e98a2d6e PP |
7 | */ |
8 | ||
c802cacb | 9 | #include <glib.h> |
c802cacb SM |
10 | #include <stdint.h> |
11 | #include <stdio.h> | |
c802cacb | 12 | |
83ad336c | 13 | #include "compat/endian.h" /* IWYU pragma: keep */ |
0f5c5d5c | 14 | #include "compat/mman.h" /* IWYU pragma: keep */ |
2cef6403 | 15 | #include "cpp-common/bt2s/make-unique.hpp" |
0f5c5d5c | 16 | #include "cpp-common/vendor/fmt/format.h" |
c802cacb | 17 | |
5656cea5 | 18 | #include "../common/src/msg-iter/msg-iter.hpp" |
087cd0f5 | 19 | #include "data-stream-file.hpp" |
c802cacb | 20 | #include "file.hpp" |
c7e1be4b SM |
21 | #include "fs.hpp" |
22 | #include "lttng-index.hpp" | |
e98a2d6e | 23 | |
4164020e | 24 | static inline size_t remaining_mmap_bytes(struct ctf_fs_ds_file *ds_file) |
e98a2d6e | 25 | { |
4164020e SM |
26 | BT_ASSERT_DBG(ds_file->mmap_len >= ds_file->request_offset_in_mapping); |
27 | return ds_file->mmap_len - ds_file->request_offset_in_mapping; | |
e98a2d6e PP |
28 | } |
29 | ||
127e2341 SM |
30 | /* |
31 | * Return true if `offset_in_file` is in the current mapping. | |
32 | */ | |
33 | ||
4164020e | 34 | static bool offset_ist_mapped(struct ctf_fs_ds_file *ds_file, off_t offset_in_file) |
127e2341 | 35 | { |
4164020e SM |
36 | return offset_in_file >= ds_file->mmap_offset_in_file && |
37 | offset_in_file < (ds_file->mmap_offset_in_file + ds_file->mmap_len); | |
127e2341 SM |
38 | } |
39 | ||
4164020e | 40 | static enum ctf_msg_iter_medium_status ds_file_munmap(struct ctf_fs_ds_file *ds_file) |
e98a2d6e | 41 | { |
4164020e | 42 | enum ctf_msg_iter_medium_status status; |
4164020e SM |
43 | |
44 | BT_ASSERT(ds_file); | |
45 | ||
46 | if (!ds_file->mmap_addr) { | |
47 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
48 | goto end; | |
49 | } | |
50 | ||
51 | if (bt_munmap(ds_file->mmap_addr, ds_file->mmap_len)) { | |
0f5c5d5c SM |
52 | BT_CPPLOGE_ERRNO_SPEC(ds_file->logger, "Cannot memory-unmap file", |
53 | ": address={}, size={}, file_path=\"{}\", file={}", | |
54 | fmt::ptr(ds_file->mmap_addr), ds_file->mmap_len, | |
a39d9817 | 55 | ds_file->file ? ds_file->file->path : "NULL", |
0f5c5d5c | 56 | ds_file->file ? fmt::ptr(ds_file->file->fp) : NULL); |
4164020e SM |
57 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
58 | goto end; | |
59 | } | |
60 | ||
61 | ds_file->mmap_addr = NULL; | |
62 | ||
63 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
fc9a526c | 64 | end: |
4164020e | 65 | return status; |
e98a2d6e PP |
66 | } |
67 | ||
127e2341 SM |
68 | /* |
69 | * mmap a region of `ds_file` such that `requested_offset_in_file` is in the | |
70 | * mapping. If the currently mmap-ed region already contains | |
71 | * `requested_offset_in_file`, the mapping is kept. | |
72 | * | |
f6e68e70 SM |
73 | * Set `ds_file->requested_offset_in_mapping` based on `request_offset_in_file`, |
74 | * such that the next call to `request_bytes` will return bytes starting at that | |
75 | * position. | |
127e2341 SM |
76 | * |
77 | * `requested_offset_in_file` must be a valid offset in the file. | |
78 | */ | |
4164020e SM |
79 | static enum ctf_msg_iter_medium_status ds_file_mmap(struct ctf_fs_ds_file *ds_file, |
80 | off_t requested_offset_in_file) | |
e98a2d6e | 81 | { |
4164020e | 82 | enum ctf_msg_iter_medium_status status; |
4164020e SM |
83 | |
84 | /* Ensure the requested offset is in the file range. */ | |
85 | BT_ASSERT(requested_offset_in_file >= 0); | |
86 | BT_ASSERT(requested_offset_in_file < ds_file->file->size); | |
87 | ||
88 | /* | |
89 | * If the mapping already contains the requested offset, just adjust | |
90 | * requested_offset_in_mapping. | |
91 | */ | |
92 | if (offset_ist_mapped(ds_file, requested_offset_in_file)) { | |
93 | ds_file->request_offset_in_mapping = | |
94 | requested_offset_in_file - ds_file->mmap_offset_in_file; | |
95 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
96 | goto end; | |
97 | } | |
98 | ||
99 | /* Unmap old region */ | |
100 | status = ds_file_munmap(ds_file); | |
101 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { | |
102 | goto end; | |
103 | } | |
104 | ||
105 | /* | |
106 | * Compute a mapping that has the required alignment properties and | |
107 | * contains `requested_offset_in_file`. | |
108 | */ | |
109 | ds_file->request_offset_in_mapping = | |
0f5c5d5c SM |
110 | requested_offset_in_file % |
111 | bt_mmap_get_offset_align_size(static_cast<int>(ds_file->logger.level())); | |
4164020e SM |
112 | ds_file->mmap_offset_in_file = requested_offset_in_file - ds_file->request_offset_in_mapping; |
113 | ds_file->mmap_len = | |
114 | MIN(ds_file->file->size - ds_file->mmap_offset_in_file, ds_file->mmap_max_len); | |
115 | ||
116 | BT_ASSERT(ds_file->mmap_len > 0); | |
117 | ||
118 | ds_file->mmap_addr = | |
85a25425 | 119 | bt_mmap(ds_file->mmap_len, PROT_READ, MAP_PRIVATE, fileno(ds_file->file->fp.get()), |
0f5c5d5c | 120 | ds_file->mmap_offset_in_file, static_cast<int>(ds_file->logger.level())); |
4164020e | 121 | if (ds_file->mmap_addr == MAP_FAILED) { |
0f5c5d5c SM |
122 | BT_CPPLOGE_SPEC(ds_file->logger, |
123 | "Cannot memory-map address (size {}) of file \"{}\" ({}) at offset {}: {}", | |
a39d9817 | 124 | ds_file->mmap_len, ds_file->file->path, fmt::ptr(ds_file->file->fp), |
0f5c5d5c | 125 | (intmax_t) ds_file->mmap_offset_in_file, strerror(errno)); |
4164020e SM |
126 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
127 | goto end; | |
128 | } | |
129 | ||
130 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
127e2341 SM |
131 | |
132 | end: | |
4164020e | 133 | return status; |
127e2341 SM |
134 | } |
135 | ||
136 | /* | |
137 | * Change the mapping of the file to read the region that follows the current | |
138 | * mapping. | |
139 | * | |
140 | * If the file hasn't been mapped yet, then everything (mmap_offset_in_file, | |
141 | * mmap_len, request_offset_in_mapping) should have the value 0, which will | |
142 | * result in the beginning of the file getting mapped. | |
143 | * | |
144 | * return _EOF if the current mapping is the end of the file. | |
145 | */ | |
146 | ||
4164020e | 147 | static enum ctf_msg_iter_medium_status ds_file_mmap_next(struct ctf_fs_ds_file *ds_file) |
127e2341 | 148 | { |
4164020e SM |
149 | enum ctf_msg_iter_medium_status status; |
150 | ||
151 | /* | |
152 | * If we're called, it's because more bytes are requested but we have | |
153 | * given all the bytes of the current mapping. | |
154 | */ | |
155 | BT_ASSERT(ds_file->request_offset_in_mapping == ds_file->mmap_len); | |
156 | ||
157 | /* | |
158 | * If the current mapping coincides with the end of the file, there is | |
159 | * no next mapping. | |
160 | */ | |
161 | if (ds_file->mmap_offset_in_file + ds_file->mmap_len == ds_file->file->size) { | |
162 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; | |
163 | goto end; | |
164 | } | |
165 | ||
166 | status = ds_file_mmap(ds_file, ds_file->mmap_offset_in_file + ds_file->mmap_len); | |
127e2341 | 167 | |
e98a2d6e | 168 | end: |
4164020e | 169 | return status; |
e98a2d6e PP |
170 | } |
171 | ||
4164020e SM |
172 | static enum ctf_msg_iter_medium_status medop_request_bytes(size_t request_sz, uint8_t **buffer_addr, |
173 | size_t *buffer_sz, void *data) | |
e98a2d6e | 174 | { |
4164020e SM |
175 | enum ctf_msg_iter_medium_status status = CTF_MSG_ITER_MEDIUM_STATUS_OK; |
176 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; | |
4164020e SM |
177 | |
178 | BT_ASSERT(request_sz > 0); | |
179 | ||
180 | /* | |
181 | * Check if we have at least one memory-mapped byte left. If we don't, | |
182 | * mmap the next file. | |
183 | */ | |
184 | if (remaining_mmap_bytes(ds_file) == 0) { | |
185 | /* Are we at the end of the file? */ | |
186 | if (ds_file->mmap_offset_in_file >= ds_file->file->size) { | |
a39d9817 SM |
187 | BT_CPPLOGD_SPEC(ds_file->logger, "Reached end of file \"{}\" ({})", ds_file->file->path, |
188 | fmt::ptr(ds_file->file->fp)); | |
4164020e SM |
189 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; |
190 | goto end; | |
191 | } | |
192 | ||
193 | status = ds_file_mmap_next(ds_file); | |
194 | switch (status) { | |
195 | case CTF_MSG_ITER_MEDIUM_STATUS_OK: | |
196 | break; | |
197 | case CTF_MSG_ITER_MEDIUM_STATUS_EOF: | |
198 | goto end; | |
199 | default: | |
0f5c5d5c | 200 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot memory-map next region of file \"{}\" ({})", |
a39d9817 | 201 | ds_file->file->path, fmt::ptr(ds_file->file->fp)); |
4164020e SM |
202 | goto error; |
203 | } | |
204 | } | |
205 | ||
206 | BT_ASSERT(remaining_mmap_bytes(ds_file) > 0); | |
207 | *buffer_sz = MIN(remaining_mmap_bytes(ds_file), request_sz); | |
208 | ||
209 | BT_ASSERT(ds_file->mmap_addr); | |
210 | *buffer_addr = ((uint8_t *) ds_file->mmap_addr) + ds_file->request_offset_in_mapping; | |
211 | ||
212 | ds_file->request_offset_in_mapping += *buffer_sz; | |
213 | goto end; | |
e98a2d6e PP |
214 | |
215 | error: | |
4164020e | 216 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
e98a2d6e PP |
217 | |
218 | end: | |
4164020e | 219 | return status; |
e98a2d6e PP |
220 | } |
221 | ||
ecd7492f | 222 | static bt_stream *medop_borrow_stream(bt_stream_class *stream_class, int64_t, void *data) |
e98a2d6e | 223 | { |
4164020e SM |
224 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; |
225 | bt_stream_class *ds_file_stream_class; | |
226 | bt_stream *stream = NULL; | |
e5be10ef | 227 | |
265d4ba2 | 228 | ds_file_stream_class = ds_file->stream->cls().libObjPtr(); |
94cf822e | 229 | |
4164020e SM |
230 | if (stream_class != ds_file_stream_class) { |
231 | /* | |
232 | * Not supported: two packets described by two different | |
233 | * stream classes within the same data stream file. | |
234 | */ | |
235 | goto end; | |
236 | } | |
e98a2d6e | 237 | |
265d4ba2 | 238 | stream = ds_file->stream->libObjPtr(); |
94cf822e PP |
239 | |
240 | end: | |
4164020e | 241 | return stream; |
e98a2d6e PP |
242 | } |
243 | ||
4164020e | 244 | static enum ctf_msg_iter_medium_status medop_seek(off_t offset, void *data) |
9e0c8dbb | 245 | { |
4164020e | 246 | struct ctf_fs_ds_file *ds_file = (struct ctf_fs_ds_file *) data; |
9e0c8dbb | 247 | |
4164020e SM |
248 | BT_ASSERT(offset >= 0); |
249 | BT_ASSERT(offset < ds_file->file->size); | |
9e0c8dbb | 250 | |
4164020e | 251 | return ds_file_mmap(ds_file, offset); |
9e0c8dbb JG |
252 | } |
253 | ||
18a1979b | 254 | struct ctf_msg_iter_medium_ops ctf_fs_ds_file_medops = { |
4164020e SM |
255 | medop_request_bytes, |
256 | medop_seek, | |
257 | nullptr, | |
258 | medop_borrow_stream, | |
e98a2d6e | 259 | }; |
6de92955 | 260 | |
4164020e SM |
261 | struct ctf_fs_ds_group_medops_data |
262 | { | |
0f5c5d5c SM |
263 | explicit ctf_fs_ds_group_medops_data(const bt2c::Logger& parentLogger) : |
264 | logger {parentLogger, "PLUGIN/SRC.CTF.FS/DS-GROUP-MEDOPS"} | |
265 | { | |
266 | } | |
267 | ||
268 | bt2c::Logger logger; | |
269 | ||
4164020e | 270 | /* Weak, set once at creation time. */ |
afb0f12b | 271 | struct ctf_fs_ds_file_group *ds_file_group = nullptr; |
4164020e SM |
272 | |
273 | /* | |
274 | * Index (as in element rank) of the index entry of ds_file_groups' | |
275 | * index we will read next (so, the one after the one we are reading | |
276 | * right now). | |
277 | */ | |
afb0f12b | 278 | guint next_index_entry_index = 0; |
4164020e SM |
279 | |
280 | /* | |
281 | * File we are currently reading. Changes whenever we switch to | |
282 | * reading another data file. | |
4164020e | 283 | */ |
55ea683f | 284 | ctf_fs_ds_file::UP file; |
4164020e SM |
285 | |
286 | /* Weak, for context / logging / appending causes. */ | |
afb0f12b | 287 | bt_self_message_iterator *self_msg_iter = nullptr; |
f6e68e70 SM |
288 | }; |
289 | ||
4164020e SM |
290 | static enum ctf_msg_iter_medium_status medop_group_request_bytes(size_t request_sz, |
291 | uint8_t **buffer_addr, | |
292 | size_t *buffer_sz, void *void_data) | |
f6e68e70 | 293 | { |
4164020e | 294 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
f6e68e70 | 295 | |
4164020e | 296 | /* Return bytes from the current file. */ |
55ea683f | 297 | return medop_request_bytes(request_sz, buffer_addr, buffer_sz, data->file.get()); |
f6e68e70 SM |
298 | } |
299 | ||
4164020e SM |
300 | static bt_stream *medop_group_borrow_stream(bt_stream_class *stream_class, int64_t stream_id, |
301 | void *void_data) | |
f6e68e70 | 302 | { |
4164020e | 303 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
f6e68e70 | 304 | |
55ea683f | 305 | return medop_borrow_stream(stream_class, stream_id, data->file.get()); |
f6e68e70 SM |
306 | } |
307 | ||
308 | /* | |
309 | * Set `data->file` to prepare it to read the packet described | |
310 | * by `index_entry`. | |
311 | */ | |
312 | ||
4164020e SM |
313 | static enum ctf_msg_iter_medium_status |
314 | ctf_fs_ds_group_medops_set_file(struct ctf_fs_ds_group_medops_data *data, | |
0f5c5d5c | 315 | struct ctf_fs_ds_index_entry *index_entry) |
f6e68e70 | 316 | { |
4164020e SM |
317 | enum ctf_msg_iter_medium_status status; |
318 | ||
319 | BT_ASSERT(data); | |
320 | BT_ASSERT(index_entry); | |
321 | ||
322 | /* Check if that file is already the one mapped. */ | |
a39d9817 | 323 | if (!data->file || data->file->file->path != index_entry->path) { |
4164020e | 324 | /* Create the new file. */ |
265d4ba2 SM |
325 | data->file = |
326 | ctf_fs_ds_file_create(data->ds_file_group->ctf_fs_trace, data->ds_file_group->stream, | |
55ea683f | 327 | index_entry->path, data->logger); |
4164020e | 328 | if (!data->file) { |
0f5c5d5c | 329 | BT_CPPLOGE_APPEND_CAUSE_SPEC(data->logger, "failed to create ctf_fs_ds_file."); |
4164020e SM |
330 | status = CTF_MSG_ITER_MEDIUM_STATUS_ERROR; |
331 | goto end; | |
332 | } | |
333 | } | |
334 | ||
335 | /* | |
336 | * Ensure the right portion of the file will be returned on the next | |
337 | * request_bytes call. | |
338 | */ | |
55ea683f | 339 | status = ds_file_mmap(data->file.get(), index_entry->offset.bytes()); |
4164020e SM |
340 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { |
341 | goto end; | |
342 | } | |
343 | ||
344 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
f6e68e70 SM |
345 | |
346 | end: | |
4164020e | 347 | return status; |
f6e68e70 SM |
348 | } |
349 | ||
4164020e | 350 | static enum ctf_msg_iter_medium_status medop_group_switch_packet(void *void_data) |
f6e68e70 | 351 | { |
4164020e SM |
352 | struct ctf_fs_ds_group_medops_data *data = (struct ctf_fs_ds_group_medops_data *) void_data; |
353 | struct ctf_fs_ds_index_entry *index_entry; | |
354 | enum ctf_msg_iter_medium_status status; | |
355 | ||
356 | /* If we have gone through all index entries, we are done. */ | |
2fb7af12 | 357 | if (data->next_index_entry_index >= data->ds_file_group->index->entries.size()) { |
4164020e SM |
358 | status = CTF_MSG_ITER_MEDIUM_STATUS_EOF; |
359 | goto end; | |
360 | } | |
361 | ||
362 | /* | |
363 | * Otherwise, look up the next index entry / packet and prepare it | |
364 | * for reading. | |
365 | */ | |
2fb7af12 | 366 | index_entry = data->ds_file_group->index->entries[data->next_index_entry_index].get(); |
4164020e | 367 | |
0f5c5d5c | 368 | status = ctf_fs_ds_group_medops_set_file(data, index_entry); |
4164020e SM |
369 | if (status != CTF_MSG_ITER_MEDIUM_STATUS_OK) { |
370 | goto end; | |
371 | } | |
372 | ||
373 | data->next_index_entry_index++; | |
374 | ||
375 | status = CTF_MSG_ITER_MEDIUM_STATUS_OK; | |
f6e68e70 | 376 | end: |
4164020e | 377 | return status; |
f6e68e70 SM |
378 | } |
379 | ||
3cf88182 SM |
380 | void ctf_fs_ds_group_medops_data_deleter::operator()(ctf_fs_ds_group_medops_data *data) noexcept |
381 | { | |
2db013e0 | 382 | delete data; |
3cf88182 SM |
383 | } |
384 | ||
f6e68e70 | 385 | enum ctf_msg_iter_medium_status ctf_fs_ds_group_medops_data_create( |
4164020e | 386 | struct ctf_fs_ds_file_group *ds_file_group, bt_self_message_iterator *self_msg_iter, |
3cf88182 | 387 | const bt2c::Logger& parentLogger, ctf_fs_ds_group_medops_data_up& out) |
f6e68e70 | 388 | { |
4164020e SM |
389 | BT_ASSERT(self_msg_iter); |
390 | BT_ASSERT(ds_file_group); | |
391 | BT_ASSERT(ds_file_group->index); | |
2fb7af12 | 392 | BT_ASSERT(!ds_file_group->index->entries.empty()); |
4164020e | 393 | |
3cf88182 SM |
394 | out.reset(new ctf_fs_ds_group_medops_data {parentLogger}); |
395 | ||
396 | out->ds_file_group = ds_file_group; | |
397 | out->self_msg_iter = self_msg_iter; | |
4164020e SM |
398 | |
399 | /* | |
400 | * No need to prepare the first file. ctf_msg_iter will call | |
401 | * switch_packet before reading the first packet, it will be | |
402 | * done then. | |
403 | */ | |
404 | ||
afb0f12b | 405 | return CTF_MSG_ITER_MEDIUM_STATUS_OK; |
f6e68e70 SM |
406 | } |
407 | ||
408 | void ctf_fs_ds_group_medops_data_reset(struct ctf_fs_ds_group_medops_data *data) | |
409 | { | |
4164020e | 410 | data->next_index_entry_index = 0; |
f6e68e70 SM |
411 | } |
412 | ||
413 | struct ctf_msg_iter_medium_ops ctf_fs_ds_group_medops = { | |
4164020e | 414 | .request_bytes = medop_group_request_bytes, |
f6e68e70 | 415 | |
4164020e SM |
416 | /* |
417 | * We don't support seeking using this medops. It would probably be | |
418 | * possible, but it's not needed at the moment. | |
419 | */ | |
420 | .seek = NULL, | |
087cd0f5 | 421 | |
4164020e SM |
422 | .switch_packet = medop_group_switch_packet, |
423 | .borrow_stream = medop_group_borrow_stream, | |
f6e68e70 SM |
424 | }; |
425 | ||
c05e1405 SM |
426 | static ctf_fs_ds_index_entry::UP ctf_fs_ds_index_entry_create(const bt2c::DataLen offset, |
427 | const bt2c::DataLen packetSize) | |
afb0f12b | 428 | { |
c05e1405 | 429 | ctf_fs_ds_index_entry::UP entry = bt2s::make_unique<ctf_fs_ds_index_entry>(offset, packetSize); |
ef7d7ac2 | 430 | |
4164020e | 431 | entry->packet_seq_num = UINT64_MAX; |
6834784d | 432 | |
4164020e | 433 | return entry; |
6834784d SM |
434 | } |
435 | ||
4164020e | 436 | static int convert_cycles_to_ns(struct ctf_clock_class *clock_class, uint64_t cycles, int64_t *ns) |
b6c3dcb2 | 437 | { |
4164020e SM |
438 | return bt_util_clock_cycles_to_ns_from_origin(cycles, clock_class->frequency, |
439 | clock_class->offset_seconds, | |
440 | clock_class->offset_cycles, ns); | |
97ade20b JG |
441 | } |
442 | ||
441fa755 SM |
443 | static ctf_fs_ds_index::UP build_index_from_idx_file(struct ctf_fs_ds_file *ds_file, |
444 | struct ctf_fs_ds_file_info *file_info, | |
445 | struct ctf_msg_iter *msg_iter) | |
97ade20b | 446 | { |
4164020e SM |
447 | int ret; |
448 | gchar *directory = NULL; | |
449 | gchar *basename = NULL; | |
450 | GString *index_basename = NULL; | |
451 | gchar *index_file_path = NULL; | |
452 | GMappedFile *mapped_file = NULL; | |
453 | gsize filesize; | |
454 | const char *mmap_begin = NULL, *file_pos = NULL; | |
455 | const struct ctf_packet_index_file_hdr *header = NULL; | |
441fa755 | 456 | ctf_fs_ds_index::UP index; |
c05e1405 SM |
457 | ctf_fs_ds_index_entry::UP index_entry; |
458 | ctf_fs_ds_index_entry *prev_index_entry = NULL; | |
ef7d7ac2 | 459 | auto totalPacketsSize = bt2c::DataLen::fromBytes(0); |
4164020e SM |
460 | size_t file_index_entry_size; |
461 | size_t file_entry_count; | |
462 | size_t i; | |
463 | struct ctf_stream_class *sc; | |
464 | struct ctf_msg_iter_packet_properties props; | |
465 | uint32_t version_major, version_minor; | |
4164020e | 466 | |
0f5c5d5c | 467 | BT_CPPLOGI_SPEC(ds_file->logger, "Building index from .idx file of stream file {}", |
a39d9817 | 468 | ds_file->file->path); |
4164020e SM |
469 | ret = ctf_msg_iter_get_packet_properties(msg_iter, &props); |
470 | if (ret) { | |
0f5c5d5c SM |
471 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
472 | "Cannot read first packet's header and context fields."); | |
4164020e SM |
473 | goto error; |
474 | } | |
475 | ||
476 | sc = ctf_trace_class_borrow_stream_class_by_id(ds_file->metadata->tc, props.stream_class_id); | |
477 | BT_ASSERT(sc); | |
478 | if (!sc->default_clock_class) { | |
0f5c5d5c | 479 | BT_CPPLOGI_STR_SPEC(ds_file->logger, "Cannot find stream class's default clock class."); |
4164020e SM |
480 | goto error; |
481 | } | |
482 | ||
483 | /* Look for index file in relative path index/name.idx. */ | |
a39d9817 | 484 | basename = g_path_get_basename(ds_file->file->path.c_str()); |
4164020e | 485 | if (!basename) { |
0f5c5d5c | 486 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot get the basename of datastream file {}", |
a39d9817 | 487 | ds_file->file->path); |
4164020e SM |
488 | goto error; |
489 | } | |
490 | ||
a39d9817 | 491 | directory = g_path_get_dirname(ds_file->file->path.c_str()); |
4164020e | 492 | if (!directory) { |
0f5c5d5c | 493 | BT_CPPLOGE_SPEC(ds_file->logger, "Cannot get dirname of datastream file {}", |
a39d9817 | 494 | ds_file->file->path); |
4164020e SM |
495 | goto error; |
496 | } | |
497 | ||
498 | index_basename = g_string_new(basename); | |
499 | if (!index_basename) { | |
0f5c5d5c | 500 | BT_CPPLOGE_STR_SPEC(ds_file->logger, "Cannot allocate index file basename string"); |
4164020e SM |
501 | goto error; |
502 | } | |
503 | ||
504 | g_string_append(index_basename, ".idx"); | |
505 | index_file_path = g_build_filename(directory, "index", index_basename->str, NULL); | |
506 | mapped_file = g_mapped_file_new(index_file_path, FALSE, NULL); | |
507 | if (!mapped_file) { | |
0f5c5d5c | 508 | BT_CPPLOGD_SPEC(ds_file->logger, "Cannot create new mapped file {}", index_file_path); |
4164020e SM |
509 | goto error; |
510 | } | |
511 | ||
512 | /* | |
513 | * The g_mapped_file API limits us to 4GB files on 32-bit. | |
514 | * Traces with such large indexes have never been seen in the wild, | |
515 | * but this would need to be adjusted to support them. | |
516 | */ | |
517 | filesize = g_mapped_file_get_length(mapped_file); | |
518 | if (filesize < sizeof(*header)) { | |
0f5c5d5c SM |
519 | BT_CPPLOGW_SPEC(ds_file->logger, |
520 | "Invalid LTTng trace index file: " | |
521 | "file size ({} bytes) < header size ({} bytes)", | |
522 | filesize, sizeof(*header)); | |
4164020e SM |
523 | goto error; |
524 | } | |
525 | ||
526 | mmap_begin = g_mapped_file_get_contents(mapped_file); | |
527 | header = (struct ctf_packet_index_file_hdr *) mmap_begin; | |
528 | ||
529 | file_pos = g_mapped_file_get_contents(mapped_file) + sizeof(*header); | |
530 | if (be32toh(header->magic) != CTF_INDEX_MAGIC) { | |
0f5c5d5c SM |
531 | BT_CPPLOGW_STR_SPEC(ds_file->logger, |
532 | "Invalid LTTng trace index: \"magic\" field validation failed"); | |
4164020e SM |
533 | goto error; |
534 | } | |
535 | ||
536 | version_major = be32toh(header->index_major); | |
537 | version_minor = be32toh(header->index_minor); | |
538 | if (version_major != 1) { | |
0f5c5d5c SM |
539 | BT_CPPLOGW_SPEC(ds_file->logger, "Unknown LTTng trace index version: major={}, minor={}", |
540 | version_major, version_minor); | |
4164020e SM |
541 | goto error; |
542 | } | |
543 | ||
544 | file_index_entry_size = be32toh(header->packet_index_len); | |
545 | if (file_index_entry_size < CTF_INDEX_1_0_SIZE) { | |
0f5c5d5c SM |
546 | BT_CPPLOGW_SPEC( |
547 | ds_file->logger, | |
4164020e | 548 | "Invalid `packet_index_len` in LTTng trace index file (`packet_index_len` < CTF index 1.0 index entry size): " |
0f5c5d5c | 549 | "packet_index_len={}, CTF_INDEX_1_0_SIZE={}", |
4164020e SM |
550 | file_index_entry_size, CTF_INDEX_1_0_SIZE); |
551 | goto error; | |
552 | } | |
553 | ||
554 | file_entry_count = (filesize - sizeof(*header)) / file_index_entry_size; | |
555 | if ((filesize - sizeof(*header)) % file_index_entry_size) { | |
0f5c5d5c SM |
556 | BT_CPPLOGW_SPEC(ds_file->logger, |
557 | "Invalid LTTng trace index: the index's size after the header " | |
558 | "({} bytes) is not a multiple of the index entry size " | |
559 | "({} bytes)", | |
560 | (filesize - sizeof(*header)), sizeof(*header)); | |
4164020e SM |
561 | goto error; |
562 | } | |
563 | ||
2fb7af12 | 564 | index = ctf_fs_ds_index_create(); |
4164020e SM |
565 | if (!index) { |
566 | goto error; | |
567 | } | |
568 | ||
569 | for (i = 0; i < file_entry_count; i++) { | |
570 | struct ctf_packet_index *file_index = (struct ctf_packet_index *) file_pos; | |
ef7d7ac2 | 571 | const auto packetSize = bt2c::DataLen::fromBits(be64toh(file_index->packet_size)); |
4164020e | 572 | |
ef7d7ac2 | 573 | if (packetSize.hasExtraBits()) { |
0f5c5d5c SM |
574 | BT_CPPLOGW_SPEC(ds_file->logger, |
575 | "Invalid packet size encountered in LTTng trace index file"); | |
4164020e SM |
576 | goto error; |
577 | } | |
578 | ||
ef7d7ac2 SM |
579 | const auto offset = bt2c::DataLen::fromBytes(be64toh(file_index->offset)); |
580 | ||
581 | if (i != 0 && offset < prev_index_entry->offset) { | |
582 | BT_CPPLOGW_SPEC( | |
583 | ds_file->logger, | |
584 | "Invalid, non-monotonic, packet offset encountered in LTTng trace index file: " | |
585 | "previous offset={} bytes, current offset={} bytes", | |
586 | prev_index_entry->offset.bytes(), offset.bytes()); | |
587 | goto error; | |
588 | } | |
589 | ||
590 | index_entry = ctf_fs_ds_index_entry_create(offset, packetSize); | |
4164020e | 591 | if (!index_entry) { |
0f5c5d5c SM |
592 | BT_CPPLOGE_APPEND_CAUSE_SPEC(ds_file->logger, |
593 | "Failed to create a ctf_fs_ds_index_entry."); | |
4164020e SM |
594 | goto error; |
595 | } | |
596 | ||
597 | /* Set path to stream file. */ | |
4d199954 | 598 | index_entry->path = file_info->path.c_str(); |
4164020e | 599 | |
4164020e SM |
600 | index_entry->timestamp_begin = be64toh(file_index->timestamp_begin); |
601 | index_entry->timestamp_end = be64toh(file_index->timestamp_end); | |
602 | if (index_entry->timestamp_end < index_entry->timestamp_begin) { | |
0f5c5d5c SM |
603 | BT_CPPLOGW_SPEC( |
604 | ds_file->logger, | |
4164020e | 605 | "Invalid packet time bounds encountered in LTTng trace index file (begin > end): " |
0f5c5d5c | 606 | "timestamp_begin={}, timestamp_end={}", |
4164020e SM |
607 | index_entry->timestamp_begin, index_entry->timestamp_end); |
608 | goto error; | |
609 | } | |
610 | ||
611 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
612 | ret = convert_cycles_to_ns(sc->default_clock_class, index_entry->timestamp_begin, | |
613 | &index_entry->timestamp_begin_ns); | |
614 | if (ret) { | |
0f5c5d5c SM |
615 | BT_CPPLOGI_STR_SPEC( |
616 | ds_file->logger, | |
4164020e SM |
617 | "Failed to convert raw timestamp to nanoseconds since Epoch during index parsing"); |
618 | goto error; | |
619 | } | |
620 | ret = convert_cycles_to_ns(sc->default_clock_class, index_entry->timestamp_end, | |
621 | &index_entry->timestamp_end_ns); | |
622 | if (ret) { | |
0f5c5d5c SM |
623 | BT_CPPLOGI_STR_SPEC( |
624 | ds_file->logger, | |
4164020e SM |
625 | "Failed to convert raw timestamp to nanoseconds since Epoch during LTTng trace index parsing"); |
626 | goto error; | |
627 | } | |
628 | ||
629 | if (version_minor >= 1) { | |
630 | index_entry->packet_seq_num = be64toh(file_index->packet_seq_num); | |
631 | } | |
632 | ||
ef7d7ac2 | 633 | totalPacketsSize += packetSize; |
4164020e SM |
634 | file_pos += file_index_entry_size; |
635 | ||
c05e1405 | 636 | prev_index_entry = index_entry.get(); |
4164020e | 637 | |
2fb7af12 | 638 | index->entries.emplace_back(std::move(index_entry)); |
4164020e SM |
639 | } |
640 | ||
641 | /* Validate that the index addresses the complete stream. */ | |
ef7d7ac2 | 642 | if (ds_file->file->size != totalPacketsSize.bytes()) { |
0f5c5d5c SM |
643 | BT_CPPLOGW_SPEC(ds_file->logger, |
644 | "Invalid LTTng trace index file; indexed size != stream file size: " | |
ef7d7ac2 SM |
645 | "file-size={} bytes, total-packets-size={} bytes", |
646 | ds_file->file->size, totalPacketsSize.bytes()); | |
4164020e SM |
647 | goto error; |
648 | } | |
b6c3dcb2 | 649 | end: |
4164020e SM |
650 | g_free(directory); |
651 | g_free(basename); | |
652 | g_free(index_file_path); | |
653 | if (index_basename) { | |
654 | g_string_free(index_basename, TRUE); | |
655 | } | |
656 | if (mapped_file) { | |
657 | g_mapped_file_unref(mapped_file); | |
658 | } | |
659 | return index; | |
97ade20b | 660 | error: |
441fa755 | 661 | index.reset(); |
4164020e | 662 | goto end; |
b6c3dcb2 JG |
663 | } |
664 | ||
4164020e | 665 | static int init_index_entry(struct ctf_fs_ds_index_entry *entry, struct ctf_fs_ds_file *ds_file, |
ef7d7ac2 | 666 | struct ctf_msg_iter_packet_properties *props) |
9e0c8dbb | 667 | { |
4164020e SM |
668 | int ret = 0; |
669 | struct ctf_stream_class *sc; | |
4164020e SM |
670 | |
671 | sc = ctf_trace_class_borrow_stream_class_by_id(ds_file->metadata->tc, props->stream_class_id); | |
672 | BT_ASSERT(sc); | |
4164020e SM |
673 | |
674 | if (props->snapshots.beginning_clock != UINT64_C(-1)) { | |
675 | entry->timestamp_begin = props->snapshots.beginning_clock; | |
676 | ||
677 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
678 | ret = convert_cycles_to_ns(sc->default_clock_class, props->snapshots.beginning_clock, | |
679 | &entry->timestamp_begin_ns); | |
680 | if (ret) { | |
0f5c5d5c SM |
681 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
682 | "Failed to convert raw timestamp to nanoseconds since Epoch."); | |
4164020e SM |
683 | goto end; |
684 | } | |
685 | } else { | |
686 | entry->timestamp_begin = UINT64_C(-1); | |
687 | entry->timestamp_begin_ns = UINT64_C(-1); | |
688 | } | |
689 | ||
690 | if (props->snapshots.end_clock != UINT64_C(-1)) { | |
691 | entry->timestamp_end = props->snapshots.end_clock; | |
692 | ||
693 | /* Convert the packet's bound to nanoseconds since Epoch. */ | |
694 | ret = convert_cycles_to_ns(sc->default_clock_class, props->snapshots.end_clock, | |
695 | &entry->timestamp_end_ns); | |
696 | if (ret) { | |
0f5c5d5c SM |
697 | BT_CPPLOGI_STR_SPEC(ds_file->logger, |
698 | "Failed to convert raw timestamp to nanoseconds since Epoch."); | |
4164020e SM |
699 | goto end; |
700 | } | |
701 | } else { | |
702 | entry->timestamp_end = UINT64_C(-1); | |
703 | entry->timestamp_end_ns = UINT64_C(-1); | |
704 | } | |
0b29603d | 705 | |
9e0c8dbb | 706 | end: |
4164020e | 707 | return ret; |
9e0c8dbb JG |
708 | } |
709 | ||
441fa755 SM |
710 | static ctf_fs_ds_index::UP build_index_from_stream_file(struct ctf_fs_ds_file *ds_file, |
711 | struct ctf_fs_ds_file_info *file_info, | |
712 | struct ctf_msg_iter *msg_iter) | |
9e0c8dbb | 713 | { |
4164020e | 714 | int ret; |
441fa755 | 715 | ctf_fs_ds_index::UP index; |
4164020e | 716 | enum ctf_msg_iter_status iter_status = CTF_MSG_ITER_STATUS_OK; |
ef7d7ac2 | 717 | auto currentPacketOffset = bt2c::DataLen::fromBytes(0); |
4164020e | 718 | |
a39d9817 | 719 | BT_CPPLOGI_SPEC(ds_file->logger, "Indexing stream file {}", ds_file->file->path); |
4164020e | 720 | |
2fb7af12 | 721 | index = ctf_fs_ds_index_create(); |
4164020e SM |
722 | if (!index) { |
723 | goto error; | |
724 | } | |
725 | ||
726 | while (true) { | |
4164020e SM |
727 | struct ctf_msg_iter_packet_properties props; |
728 | ||
ef7d7ac2 | 729 | if (currentPacketOffset.bytes() > ds_file->file->size) { |
0f5c5d5c SM |
730 | BT_CPPLOGE_STR_SPEC(ds_file->logger, |
731 | "Unexpected current packet's offset (larger than file)."); | |
4164020e | 732 | goto error; |
ef7d7ac2 | 733 | } else if (currentPacketOffset.bytes() == ds_file->file->size) { |
4164020e SM |
734 | /* No more data */ |
735 | break; | |
736 | } | |
737 | ||
ef7d7ac2 | 738 | iter_status = ctf_msg_iter_seek(msg_iter, currentPacketOffset.bytes()); |
4164020e SM |
739 | if (iter_status != CTF_MSG_ITER_STATUS_OK) { |
740 | goto error; | |
741 | } | |
742 | ||
743 | iter_status = ctf_msg_iter_get_packet_properties(msg_iter, &props); | |
744 | if (iter_status != CTF_MSG_ITER_STATUS_OK) { | |
745 | goto error; | |
746 | } | |
747 | ||
ef7d7ac2 SM |
748 | /* |
749 | * Get the current packet size from the packet header, if set. Else, | |
750 | * assume there is a single packet in the file, so take the file size | |
751 | * as the packet size. | |
752 | */ | |
753 | const auto currentPacketSize = props.exp_packet_total_size >= 0 ? | |
754 | bt2c::DataLen::fromBits(props.exp_packet_total_size) : | |
755 | bt2c::DataLen::fromBytes(ds_file->file->size); | |
4164020e | 756 | |
ef7d7ac2 | 757 | if ((currentPacketOffset + currentPacketSize).bytes() > ds_file->file->size) { |
0f5c5d5c SM |
758 | BT_CPPLOGW_SPEC(ds_file->logger, |
759 | "Invalid packet size reported in file: stream=\"{}\", " | |
ef7d7ac2 SM |
760 | "packet-offset-bytes={}, packet-size-bytes={}, " |
761 | "file-size-bytes={}", | |
a39d9817 | 762 | ds_file->file->path, currentPacketOffset.bytes(), |
ef7d7ac2 | 763 | currentPacketSize.bytes(), ds_file->file->size); |
4164020e SM |
764 | goto error; |
765 | } | |
766 | ||
c05e1405 | 767 | auto index_entry = ctf_fs_ds_index_entry_create(currentPacketOffset, currentPacketSize); |
4164020e | 768 | if (!index_entry) { |
0f5c5d5c SM |
769 | BT_CPPLOGE_APPEND_CAUSE_SPEC(ds_file->logger, |
770 | "Failed to create a ctf_fs_ds_index_entry."); | |
4164020e SM |
771 | goto error; |
772 | } | |
773 | ||
774 | /* Set path to stream file. */ | |
4d199954 | 775 | index_entry->path = file_info->path.c_str(); |
4164020e | 776 | |
c05e1405 | 777 | ret = init_index_entry(index_entry.get(), ds_file, &props); |
4164020e | 778 | if (ret) { |
4164020e SM |
779 | goto error; |
780 | } | |
781 | ||
2fb7af12 | 782 | index->entries.emplace_back(std::move(index_entry)); |
4164020e | 783 | |
ef7d7ac2 | 784 | currentPacketOffset += currentPacketSize; |
0f5c5d5c | 785 | BT_CPPLOGD_SPEC(ds_file->logger, |
ef7d7ac2 SM |
786 | "Seeking to next packet: current-packet-offset-bytes={}, " |
787 | "next-packet-offset-bytes={}", | |
788 | (currentPacketOffset - currentPacketSize).bytes(), | |
789 | currentPacketOffset.bytes()); | |
4164020e | 790 | } |
312c056a | 791 | |
9e0c8dbb | 792 | end: |
4164020e | 793 | return index; |
312c056a | 794 | |
9e0c8dbb | 795 | error: |
441fa755 | 796 | index.reset(); |
4164020e | 797 | goto end; |
9e0c8dbb JG |
798 | } |
799 | ||
89f88383 SM |
800 | ctf_fs_ds_file::UP ctf_fs_ds_file_create(struct ctf_fs_trace *ctf_fs_trace, |
801 | bt2::Stream::Shared stream, const char *path, | |
802 | const bt2c::Logger& parentLogger) | |
e98a2d6e | 803 | { |
4164020e | 804 | int ret; |
89f88383 | 805 | auto ds_file = bt2s::make_unique<ctf_fs_ds_file>(parentLogger); |
0f5c5d5c | 806 | size_t offset_align; |
4164020e | 807 | |
c44dc433 | 808 | ds_file->file = ctf_fs_file_create(parentLogger); |
4164020e SM |
809 | if (!ds_file->file) { |
810 | goto error; | |
811 | } | |
812 | ||
265d4ba2 | 813 | ds_file->stream = std::move(stream); |
4164020e | 814 | ds_file->metadata = ctf_fs_trace->metadata; |
a39d9817 | 815 | ds_file->file->path = path; |
c44dc433 | 816 | ret = ctf_fs_file_open(ds_file->file.get(), "rb"); |
4164020e SM |
817 | if (ret) { |
818 | goto error; | |
819 | } | |
820 | ||
0f5c5d5c | 821 | offset_align = bt_mmap_get_offset_align_size(static_cast<int>(ds_file->logger.level())); |
4164020e SM |
822 | ds_file->mmap_max_len = offset_align * 2048; |
823 | ||
824 | goto end; | |
1a9f7075 | 825 | |
e98a2d6e | 826 | error: |
4164020e | 827 | /* Do not touch "borrowed" file. */ |
89f88383 | 828 | ds_file.reset(); |
1a9f7075 | 829 | |
e98a2d6e | 830 | end: |
4164020e | 831 | return ds_file; |
e98a2d6e PP |
832 | } |
833 | ||
441fa755 SM |
834 | ctf_fs_ds_index::UP ctf_fs_ds_file_build_index(struct ctf_fs_ds_file *ds_file, |
835 | struct ctf_fs_ds_file_info *file_info, | |
836 | struct ctf_msg_iter *msg_iter) | |
97ade20b | 837 | { |
441fa755 | 838 | auto index = build_index_from_idx_file(ds_file, file_info, msg_iter); |
4164020e SM |
839 | if (index) { |
840 | goto end; | |
841 | } | |
842 | ||
0f5c5d5c SM |
843 | BT_CPPLOGI_SPEC(ds_file->logger, "Failed to build index from .index file; " |
844 | "falling back to stream indexing."); | |
4164020e | 845 | index = build_index_from_stream_file(ds_file, file_info, msg_iter); |
9e0c8dbb | 846 | end: |
4164020e | 847 | return index; |
97ade20b JG |
848 | } |
849 | ||
2fb7af12 | 850 | ctf_fs_ds_index::UP ctf_fs_ds_index_create() |
7ed5243a | 851 | { |
bfd852f0 | 852 | return bt2s::make_unique<ctf_fs_ds_index>(); |
7ed5243a FD |
853 | } |
854 | ||
3199f1ba | 855 | ctf_fs_ds_file::~ctf_fs_ds_file() |
e98a2d6e | 856 | { |
3199f1ba | 857 | (void) ds_file_munmap(this); |
e98a2d6e | 858 | } |
4f1f88a6 | 859 | |
2cef6403 | 860 | ctf_fs_ds_file_info::UP ctf_fs_ds_file_info_create(const char *path, int64_t begin_ns) |
873c329a | 861 | { |
2cef6403 | 862 | ctf_fs_ds_file_info::UP ds_file_info = bt2s::make_unique<ctf_fs_ds_file_info>(); |
873c329a | 863 | |
4d199954 | 864 | ds_file_info->path = path; |
873c329a | 865 | ds_file_info->begin_ns = begin_ns; |
873c329a SM |
866 | return ds_file_info; |
867 | } | |
868 | ||
fe2e19c4 SM |
869 | ctf_fs_ds_file_group::UP ctf_fs_ds_file_group_create(struct ctf_fs_trace *ctf_fs_trace, |
870 | struct ctf_stream_class *sc, | |
871 | uint64_t stream_instance_id, | |
fe2f9cda | 872 | ctf_fs_ds_index::UP index) |
fe2e19c4 SM |
873 | { |
874 | ctf_fs_ds_file_group::UP ds_file_group {new ctf_fs_ds_file_group}; | |
875 | ||
fe2f9cda | 876 | ds_file_group->index = std::move(index); |
873c329a SM |
877 | |
878 | ds_file_group->stream_id = stream_instance_id; | |
879 | BT_ASSERT(sc); | |
880 | ds_file_group->sc = sc; | |
881 | ds_file_group->ctf_fs_trace = ctf_fs_trace; | |
873c329a | 882 | |
873c329a SM |
883 | return ds_file_group; |
884 | } |