Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux

perf bench mem: Move mem op parameters into a structure

Move the benchmark function parameters into struct bench_params.

Reviewed-by: Namhyung Kim <namhyung@kernel.org>
Signed-off-by: Ankur Arora <ankur.a.arora@oracle.com>
Cc: Andrew Morton <akpm@linux-foundation.org>
Cc: Andy Lutomirski <luto@kernel.org>
Cc: Boris Ostrovsky <boris.ostrovsky@oracle.com>
Cc: Borislav Petkov <bp@alien8.de>
Cc: Dave Hansen <dave.hansen@linux.intel.com>
Cc: David Hildenbrand <david@redhat.com>
Cc: H. Peter Anvin <hpa@zytor.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
Cc: Mateusz Guzik <mjguzik@gmail.com>
Cc: Matthew Wilcox <willy@infradead.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Raghavendra K T <raghavendra.kt@amd.com>
Cc: Thomas Gleixner <tglx@linutronix.de>
Link: https://lore.kernel.org/r/20250917152418.4077386-4-ankur.a.arora@oracle.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>

authored by

Ankur Arora and committed by
Arnaldo Carvalho de Melo
dbf5dad1 07e25724

+34 -28
+34 -28
tools/perf/bench/mem-functions.c
··· 30 30 31 31 static const char *size_str = "1MB"; 32 32 static const char *function_str = "all"; 33 - static int nr_loops = 1; 33 + static unsigned int nr_loops = 1; 34 34 static bool use_cycles; 35 35 static int cycles_fd; 36 36 ··· 42 42 OPT_STRING('f', "function", &function_str, "all", 43 43 "Specify the function to run, \"all\" runs all available functions, \"help\" lists them"), 44 44 45 - OPT_INTEGER('l', "nr_loops", &nr_loops, 45 + OPT_UINTEGER('l', "nr_loops", &nr_loops, 46 46 "Specify the number of loops to run. (default: 1)"), 47 47 48 48 OPT_BOOLEAN('c', "cycles", &use_cycles, ··· 54 54 union bench_clock { 55 55 u64 cycles; 56 56 struct timeval tv; 57 + }; 58 + 59 + struct bench_params { 60 + size_t size; 61 + size_t size_total; 62 + unsigned int nr_loops; 57 63 }; 58 64 59 65 typedef void *(*memcpy_t)(void *, const void *, size_t); ··· 140 134 141 135 struct bench_mem_info { 142 136 const struct function *functions; 143 - union bench_clock (*do_op)(const struct function *r, size_t size, void *src, void *dst); 137 + union bench_clock (*do_op)(const struct function *r, struct bench_params *p, 138 + void *src, void *dst); 144 139 const char *const *usage; 145 140 bool alloc_src; 146 141 }; 147 142 148 - static void __bench_mem_function(struct bench_mem_info *info, int r_idx, size_t size, size_t size_total) 143 + static void __bench_mem_function(struct bench_mem_info *info, struct bench_params *p, 144 + int r_idx) 149 145 { 150 146 const struct function *r = &info->functions[r_idx]; 151 147 double result_bps = 0.0; 152 148 union bench_clock rt = { 0 }; 153 - void *src = NULL, *dst = zalloc(size); 149 + void *src = NULL, *dst = zalloc(p->size); 154 150 155 151 printf("# function '%s' (%s)\n", r->name, r->desc); 156 152 ··· 160 152 goto out_alloc_failed; 161 153 162 154 if (info->alloc_src) { 163 - src = zalloc(size); 155 + src = zalloc(p->size); 164 156 if (src == NULL) 165 157 goto out_alloc_failed; 166 158 } ··· 168 160 if (bench_format == 
BENCH_FORMAT_DEFAULT) 169 161 printf("# Copying %s bytes ...\n\n", size_str); 170 162 171 - rt = info->do_op(r, size, src, dst); 163 + rt = info->do_op(r, p, src, dst); 172 164 173 165 switch (bench_format) { 174 166 case BENCH_FORMAT_DEFAULT: 175 167 if (use_cycles) { 176 - printf(" %14lf cycles/byte\n", (double)rt.cycles/(double)size_total); 168 + printf(" %14lf cycles/byte\n", (double)rt.cycles/(double)p->size_total); 177 169 } else { 178 - result_bps = (double)size_total/timeval2double(&rt.tv); 170 + result_bps = (double)p->size_total/timeval2double(&rt.tv); 179 171 print_bps(result_bps); 180 172 } 181 173 break; 182 174 183 175 case BENCH_FORMAT_SIMPLE: 184 176 if (use_cycles) { 185 - printf("%lf\n", (double)rt.cycles/(double)size_total); 177 + printf("%lf\n", (double)rt.cycles/(double)p->size_total); 186 178 } else { 187 - result_bps = (double)size_total/timeval2double(&rt.tv); 179 + result_bps = (double)p->size_total/timeval2double(&rt.tv); 188 180 printf("%lf\n", result_bps); 189 181 } 190 182 break; ··· 206 198 static int bench_mem_common(int argc, const char **argv, struct bench_mem_info *info) 207 199 { 208 200 int i; 209 - size_t size; 210 - size_t size_total; 201 + struct bench_params p = { 0 }; 211 202 212 203 argc = parse_options(argc, argv, options, info->usage, 0); 213 204 ··· 218 211 } 219 212 } 220 213 221 - size = (size_t)perf_atoll((char *)size_str); 222 - size_total = size * nr_loops; 214 + p.nr_loops = nr_loops; 215 + p.size = (size_t)perf_atoll((char *)size_str); 223 216 224 - if ((s64)size <= 0) { 217 + if ((s64)p.size <= 0) { 225 218 fprintf(stderr, "Invalid size:%s\n", size_str); 226 219 return 1; 227 220 } 221 + p.size_total = p.size * p.nr_loops; 228 222 229 223 if (!strncmp(function_str, "all", 3)) { 230 224 for (i = 0; info->functions[i].name; i++) 231 - __bench_mem_function(info, i, size, size_total); 225 + __bench_mem_function(info, &p, i); 232 226 return 0; 233 227 } 234 228 ··· 248 240 return 1; 249 241 } 250 242 251 - 
__bench_mem_function(info, i, size, size_total); 243 + __bench_mem_function(info, &p, i); 252 244 253 245 return 0; 254 246 } ··· 265 257 fn(dst, src, size); 266 258 } 267 259 268 - static union bench_clock do_memcpy(const struct function *r, size_t size, 260 + static union bench_clock do_memcpy(const struct function *r, struct bench_params *p, 269 261 void *src, void *dst) 270 262 { 271 263 union bench_clock start, end; 272 264 memcpy_t fn = r->fn.memcpy; 273 - int i; 274 265 275 - memcpy_prefault(fn, size, src, dst); 266 + memcpy_prefault(fn, p->size, src, dst); 276 267 277 268 clock_get(&start); 278 - for (i = 0; i < nr_loops; ++i) 279 - fn(dst, src, size); 269 + for (unsigned int i = 0; i < p->nr_loops; ++i) 270 + fn(dst, src, p->size); 280 271 clock_get(&end); 281 272 282 273 return clock_diff(&start, &end); ··· 312 305 return bench_mem_common(argc, argv, &info); 313 306 } 314 307 315 - static union bench_clock do_memset(const struct function *r, size_t size, 308 + static union bench_clock do_memset(const struct function *r, struct bench_params *p, 316 309 void *src __maybe_unused, void *dst) 317 310 { 318 311 union bench_clock start, end; 319 312 memset_t fn = r->fn.memset; 320 - int i; 321 313 322 314 /* 323 315 * We prefault the freshly allocated memory range here, 324 316 * to not measure page fault overhead: 325 317 */ 326 - fn(dst, -1, size); 318 + fn(dst, -1, p->size); 327 319 328 320 clock_get(&start); 329 - for (i = 0; i < nr_loops; ++i) 330 - fn(dst, i, size); 321 + for (unsigned int i = 0; i < p->nr_loops; ++i) 322 + fn(dst, i, p->size); 331 323 clock_get(&end); 332 324 333 325 return clock_diff(&start, &end);