aboutsummaryrefslogtreecommitdiff
path: root/spall.h
blob: e7f564153a546f5339b42e0d3558164547fa930b (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
// SPDX-FileCopyrightText: © 2023 Phillip Trudeau-Tavara <pmttavara@protonmail.com>
// SPDX-License-Identifier: MIT

/*

TODO: Optional Helper APIs:

  - Compression API: would require a mutexed lockable context (yuck...)
      - Either using a ZIP library, a name cache + TIDPID cache, or both (but ZIP is likely more than enough!!!)
      - begin()/end() writes compressed chunks to a caller-determined destination
          - The destination can be the buffered-writing API or a custom user destination
      - Ultimately need to take a lock with some granularity... can that be the caller's responsibility?

  - Counter Event: should allow tracking arbitrary named values with a single event, for memory and frame profiling

  - Ring-buffer API
        spall_ring_init
        spall_ring_emit_begin
        spall_ring_emit_end
        spall_ring_flush
*/

#ifndef SPALL_H
#define SPALL_H

#if !defined(_MSC_VER) || defined(__clang__)
#define SPALL_NOINSTRUMENT __attribute__((no_instrument_function))
#define SPALL_FORCEINLINE __attribute__((always_inline))
#else
#define _CRT_SECURE_NO_WARNINGS
#define SPALL_NOINSTRUMENT // Can't noinstrument on MSVC!
#define SPALL_FORCEINLINE __forceinline
#endif

#include <stdint.h>
#include <stdio.h>
#include <string.h>
#include <stdbool.h>

#define SPALL_FN static inline SPALL_NOINSTRUMENT
#define SPALL_MIN(a, b) (((a) < (b)) ? (a) : (b))
#define SPALL_MAX(a, b) (((a) > (b)) ? (a) : (b))

#pragma pack(push, 1)

typedef struct SpallHeader {
    uint64_t magic_header; // = 0x0BADF00D
    uint64_t version; // = 3
    double   timestamp_unit;
    uint64_t must_be_0;
} SpallHeader;

typedef enum {
    SpallEventType_Invalid             = 0,
    SpallEventType_Custom_Data         = 1, // Basic readers can skip this.
    SpallEventType_StreamOver          = 2,

    SpallEventType_Begin               = 3,
    SpallEventType_End                 = 4,
    SpallEventType_Instant             = 5,

    SpallEventType_Overwrite_Timestamp = 6, // Retroactively change timestamp units - useful for incrementally improving RDTSC frequency.
    SpallEventType_Pad_Skip            = 7,

	SpallEventType_NameProcess         = 8,
	SpallEventType_NameThread          = 9,
} SpallEventType;

typedef struct SpallBufferHeader {
	uint32_t size;
	uint32_t tid;
	uint32_t pid;
	uint64_t first_ts;
} SpallBufferHeader;

typedef struct SpallBeginEvent {
    uint8_t type; // = SpallEventType_Begin
    uint64_t when;

    uint8_t name_length;
    uint8_t args_length;
} SpallBeginEvent;

typedef struct SpallBeginEventMax {
    SpallBeginEvent event;
    char name_bytes[255];
    char args_bytes[255];
} SpallBeginEventMax;

typedef struct SpallEndEvent {
    uint8_t  type; // = SpallEventType_End
    uint64_t when;
} SpallEndEvent;

typedef struct SpallPadSkipEvent {
    uint8_t  type; // = SpallEventType_Pad_Skip
    uint32_t size;
} SpallPadSkipEvent;

typedef struct SpallNameContainerEvent {
	uint8_t type; // = SpallEventType_NameThread/Process
	uint8_t name_length;
} SpallNameContainerEvent;

typedef struct SpallNameContainerEventMax {
    SpallNameContainerEvent event;
    char name_bytes[255];
} SpallNameContainerEventMax;

#pragma pack(pop)

typedef struct SpallProfile SpallProfile;

// Important!: If you define your own callbacks, mark them SPALL_NOINSTRUMENT!
typedef bool (*SpallWriteCallback)(SpallProfile *self, const void *data, size_t length);
typedef bool (*SpallFlushCallback)(SpallProfile *self);
typedef void (*SpallCloseCallback)(SpallProfile *self);

struct SpallProfile {
    double timestamp_unit;
    SpallWriteCallback write;
    SpallFlushCallback flush;
    SpallCloseCallback close;
    void *data;
};

// Important!: If you are writing Begin/End events, then do NOT write
//             events for the same PID + TID pair on different buffers!!!
typedef struct SpallBuffer {
    void *data;
    size_t length;
	uint32_t tid;
	uint32_t pid;

    // Internal data - don't assign this
    size_t head;
	uint64_t first_ts;
} SpallBuffer;

#ifdef __cplusplus
extern "C" {
#endif

SPALL_FN SPALL_FORCEINLINE bool spall__file_write(SpallProfile *ctx, const void *p, size_t n) {
    if (fwrite(p, n, 1, (FILE *)ctx->data) != 1) return false;
    return true;
}
SPALL_FN bool spall__file_flush(SpallProfile *ctx) {
    if (fflush((FILE *)ctx->data)) return false;
    return true;
}
SPALL_FN void spall__file_close(SpallProfile *ctx) {
    fclose((FILE *)ctx->data);
    ctx->data = NULL;
}

SPALL_FN SPALL_FORCEINLINE bool spall__buffer_flush(SpallProfile *ctx, SpallBuffer *wb, uint64_t ts) {
	wb->first_ts = SPALL_MAX(wb->first_ts, ts);

	SpallBufferHeader hdr;
	hdr.size = wb->head - sizeof(SpallBufferHeader);
	hdr.pid = wb->pid;
	hdr.tid = wb->tid;
	hdr.first_ts = wb->first_ts;

	memcpy(wb->data, &hdr, sizeof(hdr));

	if (!ctx->write(ctx, wb->data, wb->head)) return false;
    wb->head = sizeof(SpallBufferHeader);
    return true;
}

SPALL_FN bool spall_buffer_flush(SpallProfile *ctx, SpallBuffer *wb) {
    if (!spall__buffer_flush(ctx, wb, 0)) return false;
    return true;
}

SPALL_FN bool spall_buffer_quit(SpallProfile *ctx, SpallBuffer *wb) {
    if (!spall_buffer_flush(ctx, wb)) return false;
    return true;
}

SPALL_FN size_t spall_build_header(void *buffer, size_t rem_size, double timestamp_unit) {
    size_t header_size = sizeof(SpallHeader);
    if (header_size > rem_size) {
        return 0;
    }

    SpallHeader *header = (SpallHeader *)buffer;
    header->magic_header = 0x0BADF00D;
    header->version = 3;
    header->timestamp_unit = timestamp_unit;
    header->must_be_0 = 0;
    return header_size;
}
SPALL_FN SPALL_FORCEINLINE size_t spall_build_begin(void *buffer, size_t rem_size, const char *name, int32_t name_len, const char *args, int32_t args_len, uint64_t when) {
    SpallBeginEventMax *ev = (SpallBeginEventMax *)buffer;
    uint8_t trunc_name_len = (uint8_t)SPALL_MIN(name_len, 255); // will be interpreted as truncated in the app (?)
    uint8_t trunc_args_len = (uint8_t)SPALL_MIN(args_len, 255); // will be interpreted as truncated in the app (?)

    size_t ev_size = sizeof(SpallBeginEvent) + trunc_name_len + trunc_args_len;
    if (ev_size > rem_size) {
        return 0;
    }

    ev->event.type = SpallEventType_Begin;
    ev->event.when = when;
    ev->event.name_length = trunc_name_len;
    ev->event.args_length = trunc_args_len;
    memcpy(ev->name_bytes,                  name, trunc_name_len);
    memcpy(ev->name_bytes + trunc_name_len, args, trunc_args_len);

    return ev_size;
}
SPALL_FN SPALL_FORCEINLINE size_t spall_build_end(void *buffer, size_t rem_size, uint64_t when) {
    size_t ev_size = sizeof(SpallEndEvent);
    if (ev_size > rem_size) {
        return 0;
    }

    SpallEndEvent *ev = (SpallEndEvent *)buffer;
    ev->type = SpallEventType_End;
    ev->when = when;

    return ev_size;
}
SPALL_FN SPALL_FORCEINLINE size_t spall_build_name(void *buffer, size_t rem_size, const char *name, int32_t name_len, SpallEventType type) {
    SpallNameContainerEventMax *ev = (SpallNameContainerEventMax *)buffer;
    uint8_t trunc_name_len = (uint8_t)SPALL_MIN(name_len, 255); // will be interpreted as truncated in the app (?)

    size_t ev_size = sizeof(SpallNameContainerEvent) + trunc_name_len;
    if (ev_size > rem_size) {
        return 0;
    }

    ev->event.type = type;
    ev->event.name_length = trunc_name_len;
    memcpy(ev->name_bytes, name, trunc_name_len);

    return ev_size;
}

SPALL_FN void spall_quit(SpallProfile *ctx) {
    if (!ctx) return;
    if (ctx->close) ctx->close(ctx);

    memset(ctx, 0, sizeof(*ctx));
}

SPALL_FN bool spall_init_callbacks(double timestamp_unit,
								   SpallWriteCallback write,
								   SpallFlushCallback flush,
								   SpallCloseCallback close,
								   void *userdata,
								   SpallProfile *ctx) {

    if (timestamp_unit < 0) return false;

    memset(ctx, 0, sizeof(*ctx));
    ctx->timestamp_unit = timestamp_unit;
    ctx->data = userdata;
    ctx->write = write;
    ctx->flush = flush;
    ctx->close = close;

	SpallHeader header;
	size_t len = spall_build_header(&header, sizeof(header), timestamp_unit);
	if (!ctx->write(ctx, &header, len)) {
		spall_quit(ctx);
		return false;
	}

    return true;
}

SPALL_FN bool spall_init_file(const char* filename, double timestamp_unit, SpallProfile *ctx) {
    if (!filename) return false;

    FILE *f = fopen(filename, "wb"); // TODO: handle utf8 and long paths on windows
    if (f) { // basically freopen() but we don't want to force users to lug along another macro define
        fclose(f);
        f = fopen(filename, "ab");
    }
	if (!f) { return false; }

    return spall_init_callbacks(timestamp_unit, spall__file_write, spall__file_flush, spall__file_close, (void *)f, ctx);
}

SPALL_FN bool spall_flush(SpallProfile *ctx) {
    if (!ctx->flush(ctx)) return false;
    return true;
}

SPALL_FN bool spall_buffer_init(SpallProfile *ctx, SpallBuffer *wb) {
	// Fails if buffer is not big enough to contain at least one event!
	if (wb->length < sizeof(SpallBufferHeader) + sizeof(SpallBeginEventMax)) {
		return false;
	}

	wb->head = sizeof(SpallBufferHeader);
	return true;
}


SPALL_FN SPALL_FORCEINLINE bool spall_buffer_begin_args(SpallProfile *ctx, SpallBuffer *wb, const char *name, int32_t name_len, const char *args, int32_t args_len, uint64_t when) {
	if ((wb->head + sizeof(SpallBeginEventMax)) > wb->length) {
		if (!spall__buffer_flush(ctx, wb, when)) {
			return false;
		}
	}

	wb->head += spall_build_begin((char *)wb->data + wb->head, wb->length - wb->head, name, name_len, args, args_len, when);

    return true;
}

SPALL_FN bool spall_buffer_begin(SpallProfile *ctx, SpallBuffer *wb, const char *name, int32_t name_len, uint64_t when) {
    return spall_buffer_begin_args(ctx, wb, name, name_len, "", 0, when);
}

SPALL_FN bool spall_buffer_end(SpallProfile *ctx, SpallBuffer *wb, uint64_t when) {
	if ((wb->head + sizeof(SpallEndEvent)) > wb->length) {
		if (!spall__buffer_flush(ctx, wb, when)) {
			return false;
		}
	}

	wb->head += spall_build_end((char *)wb->data + wb->head, wb->length - wb->head, when);
	return true;
}

SPALL_FN bool spall_buffer_name_thread(SpallProfile *ctx, SpallBuffer *wb, const char *name, int32_t name_len) {
	if ((wb->head + sizeof(SpallNameContainerEvent)) > wb->length) {
		if (!spall__buffer_flush(ctx, wb, 0)) {
			return false;
		}
	}

	wb->head += spall_build_name((char *)wb->data + wb->head, wb->length - wb->head, name, name_len, SpallEventType_NameThread);
	return true;
}

SPALL_FN bool spall_buffer_name_process(SpallProfile *ctx, SpallBuffer *wb, const char *name, int32_t name_len) {
	if ((wb->head + sizeof(SpallNameContainerEvent)) > wb->length) {
		if (!spall__buffer_flush(ctx, wb, 0)) {
			return false;
		}
	}

	wb->head += spall_build_name((char *)wb->data + wb->head, wb->length - wb->head, name, name_len, SpallEventType_NameProcess);
	return true;
}

#ifdef __cplusplus
}
#endif

#endif // SPALL_H