@@ -173,6 +173,14 @@ class provider_allocator : public allocator_interface {
173
173
return argPos;
174
174
}
175
175
176
+ void preBench (::benchmark::State &state) override {
177
+ provider.preBench (state);
178
+ }
179
+
180
+ void postBench (::benchmark::State &state) override {
181
+ provider.postBench (state);
182
+ }
183
+
176
184
void TearDown (::benchmark::State &state) override {
177
185
provider.TearDown (state);
178
186
}
@@ -204,13 +212,18 @@ template <typename Pool> class pool_allocator : public allocator_interface {
204
212
return argPos;
205
213
}
206
214
215
+ void preBench (::benchmark::State &state) override { pool.preBench (state); }
216
+ void postBench (::benchmark::State &state) override {
217
+ pool.postBench (state);
218
+ }
219
+
207
220
void TearDown (::benchmark::State &state) override { pool.TearDown (state); }
208
221
209
- virtual void *benchAlloc (size_t size) override {
222
+ void *benchAlloc (size_t size) override {
210
223
return umfPoolMalloc (pool.pool , size);
211
224
}
212
225
213
- virtual void benchFree (void *ptr, [[maybe_unused]] size_t size) override {
226
+ void benchFree (void *ptr, [[maybe_unused]] size_t size) override {
214
227
umfPoolFree (pool.pool , ptr);
215
228
}
216
229
@@ -241,7 +254,7 @@ struct benchmark_interface : public benchmark::Fixture {
241
254
allocator.TearDown (state);
242
255
}
243
256
244
- virtual void bench (::benchmark::State &state) = 0 ;
257
+ void bench ([[maybe_unused]] ::benchmark::State &state){} ;
245
258
246
259
virtual std::vector<std::string> argsName () {
247
260
auto s = Size::argsName ();
@@ -260,6 +273,9 @@ struct benchmark_interface : public benchmark::Fixture {
260
273
benchmark->ArgNames (bench->argsName ())->Name (bench->name ());
261
274
}
262
275
276
+ void custom_counters (::benchmark::State &state) {
277
+ allocator.custom_counters (state);
278
+ }
263
279
std::vector<Size > alloc_sizes;
264
280
Allocator allocator;
265
281
};
@@ -282,7 +298,7 @@ class multiple_malloc_free_benchmark : public benchmark_interface<Size, Alloc> {
282
298
283
299
vector2d<alloc_data> allocations;
284
300
std::vector<unsigned > iters;
285
-
301
+ std::vector< size_t > memused;
286
302
vector2d<next_alloc_data> next;
287
303
std::vector<std::vector<next_alloc_data>::const_iterator> next_iter;
288
304
int64_t iterations;
@@ -302,6 +318,10 @@ class multiple_malloc_free_benchmark : public benchmark_interface<Size, Alloc> {
302
318
allocations.resize (state.threads ());
303
319
next.resize (state.threads ());
304
320
next_iter.resize (state.threads ());
321
+ memused.resize (state.threads ());
322
+ for (int i = 0 ; i < state.threads (); i++) {
323
+ memused[i] = 0 ;
324
+ }
305
325
306
326
#ifndef WIN32
307
327
// Ensure that system malloc does not have memory pooled on the heap
@@ -323,13 +343,36 @@ class multiple_malloc_free_benchmark : public benchmark_interface<Size, Alloc> {
323
343
waitForAllThreads (state);
324
344
// prepare workload for actual benchmark.
325
345
freeAllocs (state);
346
+
326
347
prealloc (state);
327
348
prepareWorkload (state);
349
+ waitForAllThreads (state);
350
+ base::allocator.preBench (state);
328
351
}
329
352
330
353
void TearDown (::benchmark::State &state) override {
354
+ base::allocator.postBench (state);
331
355
auto tid = state.thread_index ();
356
+ if (tid == 0 ) {
357
+ size_t current_memory_allocated = 0 ;
358
+ for (int i = 0 ; i < state.threads (); i++) {
359
+ current_memory_allocated += memused[i];
360
+ }
361
+
362
+ size_t memory_used = state.counters [" provider_memory_allocated" ];
363
+
364
+ if (memory_used != 0 ) {
365
+ state.counters [" benchmark_memory_allocated" ] =
366
+ current_memory_allocated;
367
+ state.counters [" memory_overhead" ] =
368
+ 100.0 * (memory_used - current_memory_allocated) /
369
+ memory_used;
370
+ } else {
371
+ state.counters .erase (" provider_memory_allocated" );
372
+ }
373
+ }
332
374
375
+ waitForAllThreads (state);
333
376
freeAllocs (state);
334
377
waitForAllThreads (state);
335
378
if (tid == 0 ) {
@@ -342,20 +385,22 @@ class multiple_malloc_free_benchmark : public benchmark_interface<Size, Alloc> {
342
385
base::TearDown (state);
343
386
}
344
387
345
- void bench (benchmark::State &state) override {
388
+ void bench (benchmark::State &state) {
346
389
auto tid = state.thread_index ();
347
390
auto &allocation = allocations[tid];
391
+ auto &memuse = memused[tid];
348
392
for (int i = 0 ; i < allocsPerIterations; i++) {
349
393
auto &n = *next_iter[tid]++;
350
394
auto &alloc = allocation[n.offset ];
351
395
base::allocator.benchFree (alloc.ptr , alloc.size );
352
-
396
+ memuse -= alloc. size ;
353
397
alloc.size = n.size ;
354
398
alloc.ptr = base::allocator.benchAlloc (alloc.size );
355
399
356
400
if (alloc.ptr == NULL ) {
357
401
state.SkipWithError (" allocation failed" );
358
402
}
403
+ memuse += alloc.size ;
359
404
}
360
405
}
361
406
@@ -376,7 +421,9 @@ class multiple_malloc_free_benchmark : public benchmark_interface<Size, Alloc> {
376
421
auto tid = state.thread_index ();
377
422
auto &i = allocations[tid];
378
423
i.resize (max_allocs);
424
+ auto &memuse = memused[tid];
379
425
auto sizeGenerator = base::alloc_sizes[tid];
426
+
380
427
for (size_t j = 0 ; j < max_allocs; j++) {
381
428
auto size = sizeGenerator.nextSize ();
382
429
i[j].ptr = base::allocator.benchAlloc (size);
@@ -385,6 +432,7 @@ class multiple_malloc_free_benchmark : public benchmark_interface<Size, Alloc> {
385
432
return ;
386
433
}
387
434
i[j].size = size;
435
+ memuse += size;
388
436
}
389
437
}
390
438
@@ -394,6 +442,7 @@ class multiple_malloc_free_benchmark : public benchmark_interface<Size, Alloc> {
394
442
for (auto &j : i) {
395
443
if (j.ptr != NULL ) {
396
444
base::allocator.benchFree (j.ptr , j.size );
445
+ memused[tid] -= j.size ;
397
446
j.ptr = NULL ;
398
447
j.size = 0 ;
399
448
}
0 commit comments