diff --git a/benchmarks/bench.c b/benchmarks/bench.c new file mode 100644 index 0000000..6872fef --- /dev/null +++ b/benchmarks/bench.c @@ -0,0 +1,332 @@ +#include "test_common.h" +#include +#include +#include +#include + +typedef struct { + double time_ms; + double pixels_per_sec; + double megabytes_per_sec; + size_t input_bytes; + size_t output_bytes; +} BenchResult; + +static double get_time_us(void) { + struct timeval tv; + gettimeofday(&tv, NULL); + return tv.tv_sec * 1000000.0 + tv.tv_usec; +} + +static void calculate_bench_metrics(const char *name, int iterations, BenchResult *r) { + if (strstr(name, "create_uniform") != NULL) { + r->input_bytes = 0; + r->output_bytes = 16 * 16 * 4; + } else if (strstr(name, "create_gradient_256") != NULL) { + r->input_bytes = 0; + r->output_bytes = 256 * 256 * 4; + } else if (strstr(name, "create_noise_1024") != NULL) { + r->input_bytes = 0; + r->output_bytes = 1024 * 1024 * 4; + } else if (strstr(name, "downsample_uniform_16x16") != NULL) { + r->input_bytes = 16 * 16 * 4; + r->output_bytes = 8 * 8 * 4; + } else if (strstr(name, "downsample_gradient_64x64") != NULL) { + r->input_bytes = 64 * 64 * 4; + r->output_bytes = 32 * 32 * 4; + } else if (strstr(name, "downsample_gradient_256x256") != NULL) { + r->input_bytes = 256 * 256 * 4; + r->output_bytes = 128 * 128 * 4; + } else if (strstr(name, "downsample_gradient_1024x1024") != NULL) { + r->input_bytes = 1024 * 1024 * 4; + r->output_bytes = 512 * 512 * 4; + } else if (strstr(name, "downsample_noise_512x512") != NULL) { + r->input_bytes = 512 * 512 * 4; + r->output_bytes = 128 * 128 * 4; + } else if (strstr(name, "downsample_noise_1024x1024") != NULL) { + r->input_bytes = 1024 * 1024 * 4; + r->output_bytes = 256 * 256 * 4; + } else if (strstr(name, "downsample_noise_1920x1080") != NULL) { + r->input_bytes = 1920 * 1080 * 4; + r->output_bytes = 960 * 540 * 4; + } else if (strstr(name, "downsample_noise_3840x2160") != NULL) { + r->input_bytes = 3840 * 2160 * 4; + r->output_bytes = 1920 * 1080 * 4; + } else if (strstr(name, "downsample_noise_4096x4096") != NULL) { + r->input_bytes = 4096 * 4096 * 4; + r->output_bytes = 1024 * 1024 * 4; + } else if (strstr(name, "downsample_checkerboard_100x100") != NULL) { + r->input_bytes = 100 * 100 * 4; + r->output_bytes = 50 * 50 * 4; + } else if (strstr(name, "downsample_checkerboard_256x256") != NULL) { + r->input_bytes = 256 * 256 * 4; + r->output_bytes = 128 * 128 * 4; + } else { + r->input_bytes = 0; + r->output_bytes = 0; + } + r->input_bytes *= (size_t)iterations; + r->output_bytes *= (size_t)iterations; +} + +static void run_bench(double (*fn)(void), int iterations, double *elapsed_ms) { + double start = get_time_us(); + for (int i = 0; i < iterations; i++) { + fn(); + } + *elapsed_ms = (get_time_us() - start) / 1000.0; +} + +static double bench_create_uniform_16x16(void) { + for (int i = 0; i < 5000; i++) { + uint8_t *img = create_uniform_image(16, 16, 128, 128, 128); + free(img); + } + return 0; +} + +static double bench_create_gradient_256x256(void) { + for (int i = 0; i < 500; i++) { + uint8_t *img = create_gradient_image(256, 256); + free(img); + } + return 0; +} + +static double bench_create_noise_1024x1024(void) { + for (int i = 0; i < 50; i++) { + uint8_t *img = create_noise_image(1024, 1024, 42); + free(img); + } + return 0; +} + +static double bench_downsample_uniform_16x16(void) { + uint8_t *src = create_uniform_image(16, 16, 128, 128, 128); + int dw, dh; + + for (int i = 0; i < 2000; i++) { + uint8_t *dst = downsample_image(src, 16, 16, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_gradient_64x64(void) { + uint8_t *src = create_gradient_image(64, 64); + int dw, dh; + + for (int i = 0; i < 500; i++) { + uint8_t *dst = downsample_image(src, 64, 64, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_gradient_256x256(void) { + uint8_t *src = create_gradient_image(256, 256); + int dw, dh; + + for (int i = 0; i < 200; i++) { + uint8_t *dst = downsample_image(src, 256, 256, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_gradient_1024x1024(void) { + uint8_t *src = create_gradient_image(1024, 1024); + int dw, dh; + + for (int i = 0; i < 20; i++) { + uint8_t *dst = downsample_image(src, 1024, 1024, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_noise_512x512(void) { + uint8_t *src = create_noise_image(512, 512, 42); + int dw, dh; + + for (int i = 0; i < 50; i++) { + uint8_t *dst = downsample_image(src, 512, 512, 4, &dw, &dh, 0.25f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_noise_1024x1024(void) { + uint8_t *src = create_noise_image(1024, 1024, 123); + int dw, dh; + + for (int i = 0; i < 15; i++) { + uint8_t *dst = downsample_image(src, 1024, 1024, 4, &dw, &dh, 0.25f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_noise_1920x1080(void) { + uint8_t *src = create_noise_image(1920, 1080, 456); + int dw, dh; + + for (int i = 0; i < 5; i++) { + uint8_t *dst = downsample_image(src, 1920, 1080, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_noise_3840x2160(void) { + uint8_t *src = create_noise_image(3840, 2160, 789); + int dw, dh; + + for (int i = 0; i < 2; i++) { + uint8_t *dst = downsample_image(src, 3840, 2160, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_noise_4096x4096(void) { + uint8_t *src = create_noise_image(4096, 4096, 456); + int dw, dh; + + for (int i = 0; i < 2; i++) { + uint8_t *dst = downsample_image(src, 4096, 4096, 4, &dw, &dh, 0.25f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_checkerboard_100x100(void) { + uint8_t *src = create_checkerboard(100, 100, 10); + int dw, dh; + + for (int i = 0; i < 200; i++) { + uint8_t *dst = downsample_image(src, 100, 100, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +static double bench_downsample_checkerboard_256x256(void) { + uint8_t *src = create_checkerboard(256, 256, 16); + int dw, dh; + + for (int i = 0; i < 100; i++) { + uint8_t *dst = downsample_image(src, 256, 256, 4, &dw, &dh, 0.5f); + free(dst); + } + + free(src); + return 0; +} + +typedef struct { + const char *name; + double (*fn)(void); +} BenchDef; + +static BenchDef benchmarks[] = { + {"create_uniform_16x16", bench_create_uniform_16x16}, + {"create_gradient_256x256", bench_create_gradient_256x256}, + {"create_noise_1024x1024", bench_create_noise_1024x1024}, + {"downsample_uniform_16x16_0.5x", bench_downsample_uniform_16x16}, + {"downsample_gradient_64x64_0.5x", bench_downsample_gradient_64x64}, + {"downsample_gradient_256x256_0.5x", bench_downsample_gradient_256x256}, + {"downsample_gradient_1024x1024_0.5x", bench_downsample_gradient_1024x1024}, + {"downsample_noise_512x512_0.25x", bench_downsample_noise_512x512}, + {"downsample_noise_1024x1024_0.25x", bench_downsample_noise_1024x1024}, + {"downsample_noise_1920x1080_0.5x", bench_downsample_noise_1920x1080}, + {"downsample_noise_3840x2160_0.5x", bench_downsample_noise_3840x2160}, + {"downsample_noise_4096x4096_0.25x", bench_downsample_noise_4096x4096}, + {"downsample_checkerboard_100x100_0.5x", bench_downsample_checkerboard_100x100}, + {"downsample_checkerboard_256x256_0.5x", bench_downsample_checkerboard_256x256}, +}; + +static int benchmark_iterations[] = { + 5000, 500, 50, 2000, 500, 200, 20, 50, 15, 5, 2, 2, 200, 100 +}; + +int main(int argc, char **argv) { + int csv_output = 0; + + for (int i = 1; i < argc; i++) { + if (strcmp(argv[i], "--csv") == 0) { + csv_output = 1; + } + } + + if (csv_output) { + printf("name,time_ms,pixels_per_sec,megabytes_per_sec,iterations\n"); + } else { + printf("Chroma Performance Benchmarks\n"); + printf("=============================\n\n"); + printf(" %-42s %16s %22s %19s\n", "Benchmark", "Time (ms)", "Pixels/sec", "MB/sec"); + printf(" %-42s %16s %22s %19s\n", "-----------------------------------------", "--------------", "-----------------", "--------------"); + } + + int num_benchmarks = sizeof(benchmarks) / sizeof(benchmarks[0]); + int max_name_len = 0; + for (int i = 0; i < num_benchmarks; i++) { + int len = strlen(benchmarks[i].name); + if (len > max_name_len) max_name_len = len; + } + + for (int i = 0; i < num_benchmarks; i++) { + BenchResult result = {0}; + calculate_bench_metrics(benchmarks[i].name, benchmark_iterations[i], &result); + + double elapsed_ms; + run_bench(benchmarks[i].fn, benchmark_iterations[i], &elapsed_ms); + + size_t total_pixels = result.input_bytes > 0 ? result.input_bytes / 4 : 0; + result.time_ms = elapsed_ms; + if (total_pixels > 0 && elapsed_ms > 0) { + result.pixels_per_sec = total_pixels / (elapsed_ms / 1000.0); + } + double total_mb = (result.input_bytes + result.output_bytes) / (1024.0 * 1024.0); + if (total_mb > 0 && elapsed_ms > 0) { + result.megabytes_per_sec = total_mb / (elapsed_ms / 1000.0); + } + + if (csv_output) { + printf("%s,%.3f,%.0f,%.2f,%d\n", + benchmarks[i].name, result.time_ms, result.pixels_per_sec, + result.megabytes_per_sec, benchmark_iterations[i]); + } else { + printf(" %-42s %16.3f %22.0f %19.2f\n", + benchmarks[i].name, result.time_ms, + result.pixels_per_sec, result.megabytes_per_sec); + } + } + + if (!csv_output) { + printf("\n"); + } + + (void)argc; + return 0; +}