1 // SPDX-License-Identifier: GPL-2.0
2 #include <errno.h>
3 #include <inttypes.h>
4 #include <linux/list.h>
5 #include <linux/compiler.h>
6 #include <linux/string.h>
7 #include "ordered-events.h"
8 #include "session.h"
9 #include "asm/bug.h"
10 #include "debug.h"
11 #include "ui/progress.h"
12
13 #define pr_N(n, fmt, ...) \
14 eprintf(n, debug_ordered_events, fmt, ##__VA_ARGS__)
15
16 #define pr(fmt, ...) pr_N(1, pr_fmt(fmt), ##__VA_ARGS__)
17
queue_event(struct ordered_events * oe,struct ordered_event * new)18 static void queue_event(struct ordered_events *oe, struct ordered_event *new)
19 {
20 struct ordered_event *last = oe->last;
21 u64 timestamp = new->timestamp;
22 struct list_head *p;
23
24 ++oe->nr_events;
25 oe->last = new;
26
27 pr_oe_time2(timestamp, "queue_event nr_events %u\n", oe->nr_events);
28
29 if (!last) {
30 list_add(&new->list, &oe->events);
31 oe->max_timestamp = timestamp;
32 return;
33 }
34
35 /*
36 * last event might point to some random place in the list as it's
37 * the last queued event. We expect that the new event is close to
38 * this.
39 */
40 if (last->timestamp <= timestamp) {
41 while (last->timestamp <= timestamp) {
42 p = last->list.next;
43 if (p == &oe->events) {
44 list_add_tail(&new->list, &oe->events);
45 oe->max_timestamp = timestamp;
46 return;
47 }
48 last = list_entry(p, struct ordered_event, list);
49 }
50 list_add_tail(&new->list, &last->list);
51 } else {
52 while (last->timestamp > timestamp) {
53 p = last->list.prev;
54 if (p == &oe->events) {
55 list_add(&new->list, &oe->events);
56 return;
57 }
58 last = list_entry(p, struct ordered_event, list);
59 }
60 list_add(&new->list, &last->list);
61 }
62 }
63
__dup_event(struct ordered_events * oe,union perf_event * event)64 static union perf_event *__dup_event(struct ordered_events *oe,
65 union perf_event *event)
66 {
67 union perf_event *new_event = NULL;
68
69 if (oe->cur_alloc_size < oe->max_alloc_size) {
70 new_event = memdup(event, event->header.size);
71 if (new_event)
72 oe->cur_alloc_size += event->header.size;
73 }
74
75 return new_event;
76 }
77
dup_event(struct ordered_events * oe,union perf_event * event)78 static union perf_event *dup_event(struct ordered_events *oe,
79 union perf_event *event)
80 {
81 return oe->copy_on_queue ? __dup_event(oe, event) : event;
82 }
83
__free_dup_event(struct ordered_events * oe,union perf_event * event)84 static void __free_dup_event(struct ordered_events *oe, union perf_event *event)
85 {
86 if (event) {
87 oe->cur_alloc_size -= event->header.size;
88 free(event);
89 }
90 }
91
free_dup_event(struct ordered_events * oe,union perf_event * event)92 static void free_dup_event(struct ordered_events *oe, union perf_event *event)
93 {
94 if (oe->copy_on_queue)
95 __free_dup_event(oe, event);
96 }
97
98 #define MAX_SAMPLE_BUFFER (64 * 1024 / sizeof(struct ordered_event))
alloc_event(struct ordered_events * oe,union perf_event * event)99 static struct ordered_event *alloc_event(struct ordered_events *oe,
100 union perf_event *event)
101 {
102 struct list_head *cache = &oe->cache;
103 struct ordered_event *new = NULL;
104 union perf_event *new_event;
105 size_t size;
106
107 new_event = dup_event(oe, event);
108 if (!new_event)
109 return NULL;
110
111 /*
112 * We maintain the following scheme of buffers for ordered
113 * event allocation:
114 *
115 * to_free list -> buffer1 (64K)
116 * buffer2 (64K)
117 * ...
118 *
119 * Each buffer keeps an array of ordered events objects:
120 * buffer -> event[0]
121 * event[1]
122 * ...
123 *
124 * Each allocated ordered event is linked to one of
125 * following lists:
126 * - time ordered list 'events'
127 * - list of currently removed events 'cache'
128 *
129 * Allocation of the ordered event uses the following order
130 * to get the memory:
131 * - use recently removed object from 'cache' list
132 * - use available object in current allocation buffer
133 * - allocate new buffer if the current buffer is full
134 *
135 * Removal of ordered event object moves it from events to
136 * the cache list.
137 */
138 size = sizeof(*oe->buffer) + MAX_SAMPLE_BUFFER * sizeof(*new);
139
140 if (!list_empty(cache)) {
141 new = list_entry(cache->next, struct ordered_event, list);
142 list_del_init(&new->list);
143 } else if (oe->buffer) {
144 new = &oe->buffer->event[oe->buffer_idx];
145 if (++oe->buffer_idx == MAX_SAMPLE_BUFFER)
146 oe->buffer = NULL;
147 } else if ((oe->cur_alloc_size + size) < oe->max_alloc_size) {
148 oe->buffer = malloc(size);
149 if (!oe->buffer) {
150 free_dup_event(oe, new_event);
151 return NULL;
152 }
153
154 pr("alloc size %" PRIu64 "B (+%zu), max %" PRIu64 "B\n",
155 oe->cur_alloc_size, size, oe->max_alloc_size);
156
157 oe->cur_alloc_size += size;
158 list_add(&oe->buffer->list, &oe->to_free);
159
160 oe->buffer_idx = 1;
161 new = &oe->buffer->event[0];
162 } else {
163 pr("allocation limit reached %" PRIu64 "B\n", oe->max_alloc_size);
164 return NULL;
165 }
166
167 new->event = new_event;
168 return new;
169 }
170
171 static struct ordered_event *
ordered_events__new_event(struct ordered_events * oe,u64 timestamp,union perf_event * event)172 ordered_events__new_event(struct ordered_events *oe, u64 timestamp,
173 union perf_event *event)
174 {
175 struct ordered_event *new;
176
177 new = alloc_event(oe, event);
178 if (new) {
179 new->timestamp = timestamp;
180 queue_event(oe, new);
181 }
182
183 return new;
184 }
185
ordered_events__delete(struct ordered_events * oe,struct ordered_event * event)186 void ordered_events__delete(struct ordered_events *oe, struct ordered_event *event)
187 {
188 list_move(&event->list, &oe->cache);
189 oe->nr_events--;
190 free_dup_event(oe, event->event);
191 event->event = NULL;
192 }
193
ordered_events__queue(struct ordered_events * oe,union perf_event * event,u64 timestamp,u64 file_offset)194 int ordered_events__queue(struct ordered_events *oe, union perf_event *event,
195 u64 timestamp, u64 file_offset)
196 {
197 struct ordered_event *oevent;
198
199 if (!timestamp || timestamp == ~0ULL)
200 return -ETIME;
201
202 if (timestamp < oe->last_flush) {
203 pr_oe_time(timestamp, "out of order event\n");
204 pr_oe_time(oe->last_flush, "last flush, last_flush_type %d\n",
205 oe->last_flush_type);
206
207 oe->nr_unordered_events++;
208 }
209
210 oevent = ordered_events__new_event(oe, timestamp, event);
211 if (!oevent) {
212 ordered_events__flush(oe, OE_FLUSH__HALF);
213 oevent = ordered_events__new_event(oe, timestamp, event);
214 }
215
216 if (!oevent)
217 return -ENOMEM;
218
219 oevent->file_offset = file_offset;
220 return 0;
221 }
222
do_flush(struct ordered_events * oe,bool show_progress)223 static int do_flush(struct ordered_events *oe, bool show_progress)
224 {
225 struct list_head *head = &oe->events;
226 struct ordered_event *tmp, *iter;
227 u64 limit = oe->next_flush;
228 u64 last_ts = oe->last ? oe->last->timestamp : 0ULL;
229 struct ui_progress prog;
230 int ret;
231
232 if (!limit)
233 return 0;
234
235 if (show_progress)
236 ui_progress__init(&prog, oe->nr_events, "Processing time ordered events...");
237
238 list_for_each_entry_safe(iter, tmp, head, list) {
239 if (session_done())
240 return 0;
241
242 if (iter->timestamp > limit)
243 break;
244 ret = oe->deliver(oe, iter);
245 if (ret)
246 return ret;
247
248 ordered_events__delete(oe, iter);
249 oe->last_flush = iter->timestamp;
250
251 if (show_progress)
252 ui_progress__update(&prog, 1);
253 }
254
255 if (list_empty(head))
256 oe->last = NULL;
257 else if (last_ts <= limit)
258 oe->last = list_entry(head->prev, struct ordered_event, list);
259
260 if (show_progress)
261 ui_progress__finish();
262
263 return 0;
264 }
265
__ordered_events__flush(struct ordered_events * oe,enum oe_flush how,u64 timestamp)266 static int __ordered_events__flush(struct ordered_events *oe, enum oe_flush how,
267 u64 timestamp)
268 {
269 static const char * const str[] = {
270 "NONE",
271 "FINAL",
272 "ROUND",
273 "HALF ",
274 "TOP ",
275 "TIME ",
276 };
277 int err;
278 bool show_progress = false;
279
280 if (oe->nr_events == 0)
281 return 0;
282
283 switch (how) {
284 case OE_FLUSH__FINAL:
285 show_progress = true;
286 __fallthrough;
287 case OE_FLUSH__TOP:
288 oe->next_flush = ULLONG_MAX;
289 break;
290
291 case OE_FLUSH__HALF:
292 {
293 struct ordered_event *first, *last;
294 struct list_head *head = &oe->events;
295
296 first = list_entry(head->next, struct ordered_event, list);
297 last = oe->last;
298
299 /* Warn if we are called before any event got allocated. */
300 if (WARN_ONCE(!last || list_empty(head), "empty queue"))
301 return 0;
302
303 oe->next_flush = first->timestamp;
304 oe->next_flush += (last->timestamp - first->timestamp) / 2;
305 break;
306 }
307
308 case OE_FLUSH__TIME:
309 oe->next_flush = timestamp;
310 show_progress = false;
311 break;
312
313 case OE_FLUSH__ROUND:
314 case OE_FLUSH__NONE:
315 default:
316 break;
317 };
318
319 pr_oe_time(oe->next_flush, "next_flush - ordered_events__flush PRE %s, nr_events %u\n",
320 str[how], oe->nr_events);
321 pr_oe_time(oe->max_timestamp, "max_timestamp\n");
322
323 err = do_flush(oe, show_progress);
324
325 if (!err) {
326 if (how == OE_FLUSH__ROUND)
327 oe->next_flush = oe->max_timestamp;
328
329 oe->last_flush_type = how;
330 }
331
332 pr_oe_time(oe->next_flush, "next_flush - ordered_events__flush POST %s, nr_events %u\n",
333 str[how], oe->nr_events);
334 pr_oe_time(oe->last_flush, "last_flush\n");
335
336 return err;
337 }
338
ordered_events__flush(struct ordered_events * oe,enum oe_flush how)339 int ordered_events__flush(struct ordered_events *oe, enum oe_flush how)
340 {
341 return __ordered_events__flush(oe, how, 0);
342 }
343
ordered_events__flush_time(struct ordered_events * oe,u64 timestamp)344 int ordered_events__flush_time(struct ordered_events *oe, u64 timestamp)
345 {
346 return __ordered_events__flush(oe, OE_FLUSH__TIME, timestamp);
347 }
348
ordered_events__first_time(struct ordered_events * oe)349 u64 ordered_events__first_time(struct ordered_events *oe)
350 {
351 struct ordered_event *event;
352
353 if (list_empty(&oe->events))
354 return 0;
355
356 event = list_first_entry(&oe->events, struct ordered_event, list);
357 return event->timestamp;
358 }
359
ordered_events__init(struct ordered_events * oe,ordered_events__deliver_t deliver,void * data)360 void ordered_events__init(struct ordered_events *oe, ordered_events__deliver_t deliver,
361 void *data)
362 {
363 INIT_LIST_HEAD(&oe->events);
364 INIT_LIST_HEAD(&oe->cache);
365 INIT_LIST_HEAD(&oe->to_free);
366 oe->max_alloc_size = (u64) -1;
367 oe->cur_alloc_size = 0;
368 oe->deliver = deliver;
369 oe->data = data;
370 }
371
372 static void
ordered_events_buffer__free(struct ordered_events_buffer * buffer,unsigned int max,struct ordered_events * oe)373 ordered_events_buffer__free(struct ordered_events_buffer *buffer,
374 unsigned int max, struct ordered_events *oe)
375 {
376 if (oe->copy_on_queue) {
377 unsigned int i;
378
379 for (i = 0; i < max; i++)
380 __free_dup_event(oe, buffer->event[i].event);
381 }
382
383 free(buffer);
384 }
385
ordered_events__free(struct ordered_events * oe)386 void ordered_events__free(struct ordered_events *oe)
387 {
388 struct ordered_events_buffer *buffer, *tmp;
389
390 if (list_empty(&oe->to_free))
391 return;
392
393 /*
394 * Current buffer might not have all the events allocated
395 * yet, we need to free only allocated ones ...
396 */
397 if (oe->buffer) {
398 list_del_init(&oe->buffer->list);
399 ordered_events_buffer__free(oe->buffer, oe->buffer_idx, oe);
400 }
401
402 /* ... and continue with the rest */
403 list_for_each_entry_safe(buffer, tmp, &oe->to_free, list) {
404 list_del_init(&buffer->list);
405 ordered_events_buffer__free(buffer, MAX_SAMPLE_BUFFER, oe);
406 }
407 }
408
ordered_events__reinit(struct ordered_events * oe)409 void ordered_events__reinit(struct ordered_events *oe)
410 {
411 ordered_events__deliver_t old_deliver = oe->deliver;
412
413 ordered_events__free(oe);
414 memset(oe, '\0', sizeof(*oe));
415 ordered_events__init(oe, old_deliver, oe->data);
416 }
417