1 // SPDX-License-Identifier: GPL-2.0
2 #include <errno.h>
3 #include <inttypes.h>
4 #include <linux/list.h>
5 #include <linux/compiler.h>
6 #include <linux/string.h>
7 #include "ordered-events.h"
8 #include "session.h"
9 #include "asm/bug.h"
10 #include "debug.h"
11 #include "ui/progress.h"
12
13 #define pr_N(n, fmt, ...) \
14 eprintf(n, debug_ordered_events, fmt, ##__VA_ARGS__)
15
16 #define pr(fmt, ...) pr_N(1, pr_fmt(fmt), ##__VA_ARGS__)
17
queue_event(struct ordered_events * oe,struct ordered_event * new)18 static void queue_event(struct ordered_events *oe, struct ordered_event *new)
19 {
20 struct ordered_event *last = oe->last;
21 u64 timestamp = new->timestamp;
22 struct list_head *p;
23
24 ++oe->nr_events;
25 oe->last = new;
26
27 pr_oe_time2(timestamp, "queue_event nr_events %u\n", oe->nr_events);
28
29 if (!last) {
30 list_add(&new->list, &oe->events);
31 oe->max_timestamp = timestamp;
32 return;
33 }
34
35 /*
36 * last event might point to some random place in the list as it's
37 * the last queued event. We expect that the new event is close to
38 * this.
39 */
40 if (last->timestamp <= timestamp) {
41 while (last->timestamp <= timestamp) {
42 p = last->list.next;
43 if (p == &oe->events) {
44 list_add_tail(&new->list, &oe->events);
45 oe->max_timestamp = timestamp;
46 return;
47 }
48 last = list_entry(p, struct ordered_event, list);
49 }
50 list_add_tail(&new->list, &last->list);
51 } else {
52 while (last->timestamp > timestamp) {
53 p = last->list.prev;
54 if (p == &oe->events) {
55 list_add(&new->list, &oe->events);
56 return;
57 }
58 last = list_entry(p, struct ordered_event, list);
59 }
60 list_add(&new->list, &last->list);
61 }
62 }
63
__dup_event(struct ordered_events * oe,union perf_event * event)64 static union perf_event *__dup_event(struct ordered_events *oe,
65 union perf_event *event)
66 {
67 union perf_event *new_event = NULL;
68
69 if (oe->cur_alloc_size < oe->max_alloc_size) {
70 new_event = memdup(event, event->header.size);
71 if (new_event)
72 oe->cur_alloc_size += event->header.size;
73 }
74
75 return new_event;
76 }
77
dup_event(struct ordered_events * oe,union perf_event * event)78 static union perf_event *dup_event(struct ordered_events *oe,
79 union perf_event *event)
80 {
81 return oe->copy_on_queue ? __dup_event(oe, event) : event;
82 }
83
__free_dup_event(struct ordered_events * oe,union perf_event * event)84 static void __free_dup_event(struct ordered_events *oe, union perf_event *event)
85 {
86 if (event) {
87 oe->cur_alloc_size -= event->header.size;
88 free(event);
89 }
90 }
91
free_dup_event(struct ordered_events * oe,union perf_event * event)92 static void free_dup_event(struct ordered_events *oe, union perf_event *event)
93 {
94 if (oe->copy_on_queue)
95 __free_dup_event(oe, event);
96 }
97
98 #define MAX_SAMPLE_BUFFER (64 * 1024 / sizeof(struct ordered_event))
alloc_event(struct ordered_events * oe,union perf_event * event)99 static struct ordered_event *alloc_event(struct ordered_events *oe,
100 union perf_event *event)
101 {
102 struct list_head *cache = &oe->cache;
103 struct ordered_event *new = NULL;
104 union perf_event *new_event;
105 size_t size;
106
107 new_event = dup_event(oe, event);
108 if (!new_event)
109 return NULL;
110
111 /*
112 * We maintain the following scheme of buffers for ordered
113 * event allocation:
114 *
115 * to_free list -> buffer1 (64K)
116 * buffer2 (64K)
117 * ...
118 *
119 * Each buffer keeps an array of ordered events objects:
120 * buffer -> event[0]
121 * event[1]
122 * ...
123 *
124 * Each allocated ordered event is linked to one of
125 * following lists:
126 * - time ordered list 'events'
127 * - list of currently removed events 'cache'
128 *
129 * Allocation of the ordered event uses the following order
130 * to get the memory:
131 * - use recently removed object from 'cache' list
132 * - use available object in current allocation buffer
133 * - allocate new buffer if the current buffer is full
134 *
135 * Removal of ordered event object moves it from events to
136 * the cache list.
137 */
138 size = sizeof(*oe->buffer) + MAX_SAMPLE_BUFFER * sizeof(*new);
139
140 if (!list_empty(cache)) {
141 new = list_entry(cache->next, struct ordered_event, list);
142 list_del_init(&new->list);
143 } else if (oe->buffer) {
144 new = &oe->buffer->event[oe->buffer_idx];
145 if (++oe->buffer_idx == MAX_SAMPLE_BUFFER)
146 oe->buffer = NULL;
147 } else if ((oe->cur_alloc_size + size) < oe->max_alloc_size) {
148 oe->buffer = malloc(size);
149 if (!oe->buffer) {
150 free_dup_event(oe, new_event);
151 return NULL;
152 }
153
154 pr("alloc size %" PRIu64 "B (+%zu), max %" PRIu64 "B\n",
155 oe->cur_alloc_size, size, oe->max_alloc_size);
156
157 oe->cur_alloc_size += size;
158 list_add(&oe->buffer->list, &oe->to_free);
159
160 oe->buffer_idx = 1;
161 new = &oe->buffer->event[0];
162 } else {
163 pr("allocation limit reached %" PRIu64 "B\n", oe->max_alloc_size);
164 return NULL;
165 }
166
167 new->event = new_event;
168 return new;
169 }
170
171 static struct ordered_event *
ordered_events__new_event(struct ordered_events * oe,u64 timestamp,union perf_event * event)172 ordered_events__new_event(struct ordered_events *oe, u64 timestamp,
173 union perf_event *event)
174 {
175 struct ordered_event *new;
176
177 new = alloc_event(oe, event);
178 if (new) {
179 new->timestamp = timestamp;
180 queue_event(oe, new);
181 }
182
183 return new;
184 }
185
ordered_events__delete(struct ordered_events * oe,struct ordered_event * event)186 void ordered_events__delete(struct ordered_events *oe, struct ordered_event *event)
187 {
188 list_move(&event->list, &oe->cache);
189 oe->nr_events--;
190 free_dup_event(oe, event->event);
191 event->event = NULL;
192 }
193
ordered_events__queue(struct ordered_events * oe,union perf_event * event,u64 timestamp,u64 file_offset,const char * file_path)194 int ordered_events__queue(struct ordered_events *oe, union perf_event *event,
195 u64 timestamp, u64 file_offset, const char *file_path)
196 {
197 struct ordered_event *oevent;
198
199 if (!timestamp || timestamp == ~0ULL)
200 return -ETIME;
201
202 if (timestamp < oe->last_flush) {
203 pr_oe_time(timestamp, "out of order event\n");
204 pr_oe_time(oe->last_flush, "last flush, last_flush_type %d\n",
205 oe->last_flush_type);
206
207 oe->nr_unordered_events++;
208 }
209
210 oevent = ordered_events__new_event(oe, timestamp, event);
211 if (!oevent) {
212 ordered_events__flush(oe, OE_FLUSH__HALF);
213 oevent = ordered_events__new_event(oe, timestamp, event);
214 }
215
216 if (!oevent)
217 return -ENOMEM;
218
219 oevent->file_offset = file_offset;
220 oevent->file_path = file_path;
221 return 0;
222 }
223
do_flush(struct ordered_events * oe,bool show_progress)224 static int do_flush(struct ordered_events *oe, bool show_progress)
225 {
226 struct list_head *head = &oe->events;
227 struct ordered_event *tmp, *iter;
228 u64 limit = oe->next_flush;
229 u64 last_ts = oe->last ? oe->last->timestamp : 0ULL;
230 struct ui_progress prog;
231 int ret;
232
233 if (!limit)
234 return 0;
235
236 if (show_progress)
237 ui_progress__init(&prog, oe->nr_events, "Processing time ordered events...");
238
239 list_for_each_entry_safe(iter, tmp, head, list) {
240 if (session_done())
241 return 0;
242
243 if (iter->timestamp > limit)
244 break;
245 ret = oe->deliver(oe, iter);
246 if (ret)
247 return ret;
248
249 ordered_events__delete(oe, iter);
250 oe->last_flush = iter->timestamp;
251
252 if (show_progress)
253 ui_progress__update(&prog, 1);
254 }
255
256 if (list_empty(head))
257 oe->last = NULL;
258 else if (last_ts <= limit)
259 oe->last = list_entry(head->prev, struct ordered_event, list);
260
261 if (show_progress)
262 ui_progress__finish();
263
264 return 0;
265 }
266
__ordered_events__flush(struct ordered_events * oe,enum oe_flush how,u64 timestamp)267 static int __ordered_events__flush(struct ordered_events *oe, enum oe_flush how,
268 u64 timestamp)
269 {
270 static const char * const str[] = {
271 "NONE",
272 "FINAL",
273 "ROUND",
274 "HALF ",
275 "TOP ",
276 "TIME ",
277 };
278 int err;
279 bool show_progress = false;
280
281 if (oe->nr_events == 0)
282 return 0;
283
284 switch (how) {
285 case OE_FLUSH__FINAL:
286 show_progress = true;
287 fallthrough;
288 case OE_FLUSH__TOP:
289 oe->next_flush = ULLONG_MAX;
290 break;
291
292 case OE_FLUSH__HALF:
293 {
294 struct ordered_event *first, *last;
295 struct list_head *head = &oe->events;
296
297 first = list_entry(head->next, struct ordered_event, list);
298 last = oe->last;
299
300 /* Warn if we are called before any event got allocated. */
301 if (WARN_ONCE(!last || list_empty(head), "empty queue"))
302 return 0;
303
304 oe->next_flush = first->timestamp;
305 oe->next_flush += (last->timestamp - first->timestamp) / 2;
306 break;
307 }
308
309 case OE_FLUSH__TIME:
310 oe->next_flush = timestamp;
311 show_progress = false;
312 break;
313
314 case OE_FLUSH__ROUND:
315 case OE_FLUSH__NONE:
316 default:
317 break;
318 }
319
320 pr_oe_time(oe->next_flush, "next_flush - ordered_events__flush PRE %s, nr_events %u\n",
321 str[how], oe->nr_events);
322 pr_oe_time(oe->max_timestamp, "max_timestamp\n");
323
324 err = do_flush(oe, show_progress);
325
326 if (!err) {
327 if (how == OE_FLUSH__ROUND)
328 oe->next_flush = oe->max_timestamp;
329
330 oe->last_flush_type = how;
331 }
332
333 pr_oe_time(oe->next_flush, "next_flush - ordered_events__flush POST %s, nr_events %u\n",
334 str[how], oe->nr_events);
335 pr_oe_time(oe->last_flush, "last_flush\n");
336
337 return err;
338 }
339
ordered_events__flush(struct ordered_events * oe,enum oe_flush how)340 int ordered_events__flush(struct ordered_events *oe, enum oe_flush how)
341 {
342 return __ordered_events__flush(oe, how, 0);
343 }
344
ordered_events__flush_time(struct ordered_events * oe,u64 timestamp)345 int ordered_events__flush_time(struct ordered_events *oe, u64 timestamp)
346 {
347 return __ordered_events__flush(oe, OE_FLUSH__TIME, timestamp);
348 }
349
ordered_events__first_time(struct ordered_events * oe)350 u64 ordered_events__first_time(struct ordered_events *oe)
351 {
352 struct ordered_event *event;
353
354 if (list_empty(&oe->events))
355 return 0;
356
357 event = list_first_entry(&oe->events, struct ordered_event, list);
358 return event->timestamp;
359 }
360
ordered_events__init(struct ordered_events * oe,ordered_events__deliver_t deliver,void * data)361 void ordered_events__init(struct ordered_events *oe, ordered_events__deliver_t deliver,
362 void *data)
363 {
364 INIT_LIST_HEAD(&oe->events);
365 INIT_LIST_HEAD(&oe->cache);
366 INIT_LIST_HEAD(&oe->to_free);
367 oe->max_alloc_size = (u64) -1;
368 oe->cur_alloc_size = 0;
369 oe->deliver = deliver;
370 oe->data = data;
371 }
372
373 static void
ordered_events_buffer__free(struct ordered_events_buffer * buffer,unsigned int max,struct ordered_events * oe)374 ordered_events_buffer__free(struct ordered_events_buffer *buffer,
375 unsigned int max, struct ordered_events *oe)
376 {
377 if (oe->copy_on_queue) {
378 unsigned int i;
379
380 for (i = 0; i < max; i++)
381 __free_dup_event(oe, buffer->event[i].event);
382 }
383
384 free(buffer);
385 }
386
ordered_events__free(struct ordered_events * oe)387 void ordered_events__free(struct ordered_events *oe)
388 {
389 struct ordered_events_buffer *buffer, *tmp;
390
391 if (list_empty(&oe->to_free))
392 return;
393
394 /*
395 * Current buffer might not have all the events allocated
396 * yet, we need to free only allocated ones ...
397 */
398 if (oe->buffer) {
399 list_del_init(&oe->buffer->list);
400 ordered_events_buffer__free(oe->buffer, oe->buffer_idx, oe);
401 }
402
403 /* ... and continue with the rest */
404 list_for_each_entry_safe(buffer, tmp, &oe->to_free, list) {
405 list_del_init(&buffer->list);
406 ordered_events_buffer__free(buffer, MAX_SAMPLE_BUFFER, oe);
407 }
408 }
409
ordered_events__reinit(struct ordered_events * oe)410 void ordered_events__reinit(struct ordered_events *oe)
411 {
412 ordered_events__deliver_t old_deliver = oe->deliver;
413
414 ordered_events__free(oe);
415 memset(oe, '\0', sizeof(*oe));
416 ordered_events__init(oe, old_deliver, oe->data);
417 }
418