forked from Green-Sky/tomato
Initial
This commit is contained in:
512
qoibench.c
Normal file
512
qoibench.c
Normal file
@ -0,0 +1,512 @@
|
||||
/*
|
||||
|
||||
Simple benchmark suite for png, stbi and qoi
|
||||
|
||||
Requires libpng, "stb_image.h" and "stb_image_write.h"
|
||||
Compile with:
|
||||
gcc qoibench.c -std=gnu99 -O3 -o qoibench
|
||||
|
||||
Dominic Szablewski - https://phoboslab.org
|
||||
|
||||
|
||||
-- LICENSE: The MIT License(MIT)
|
||||
|
||||
Copyright(c) 2021 Dominic Szablewski
|
||||
|
||||
Permission is hereby granted, free of charge, to any person obtaining a copy of
|
||||
this software and associated documentation files(the "Software"), to deal in
|
||||
the Software without restriction, including without limitation the rights to
|
||||
use, copy, modify, merge, publish, distribute, sublicense, and / or sell copies
|
||||
of the Software, and to permit persons to whom the Software is furnished to do
|
||||
so, subject to the following conditions :
|
||||
The above copyright notice and this permission notice shall be included in all
|
||||
copies or substantial portions of the Software.
|
||||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.IN NO EVENT SHALL THE
|
||||
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||||
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
||||
SOFTWARE.
|
||||
|
||||
*/
|
||||
|
||||
#include <stdio.h>
|
||||
#include <dirent.h>
|
||||
#include <png.h>
|
||||
|
||||
#define STB_IMAGE_IMPLEMENTATION
|
||||
#define STBI_ONLY_PNG
|
||||
#define STBI_NO_LINEAR
|
||||
#include "stb_image.h"
|
||||
|
||||
#define STB_IMAGE_WRITE_IMPLEMENTATION
|
||||
#include "stb_image_write.h"
|
||||
|
||||
#define QOI_IMPLEMENTATION
|
||||
#include "qoi.h"
|
||||
|
||||
|
||||
|
||||
|
||||
// -----------------------------------------------------------------------------
|
||||
// Cross platform high resolution timer
|
||||
// From https://gist.github.com/ForeverZer0/0a4f80fc02b96e19380ebb7a3debbee5
|
||||
|
||||
#include <stdint.h>
|
||||
#if defined(__linux)
|
||||
#define HAVE_POSIX_TIMER
|
||||
#include <time.h>
|
||||
#ifdef CLOCK_MONOTONIC
|
||||
#define CLOCKID CLOCK_MONOTONIC
|
||||
#else
|
||||
#define CLOCKID CLOCK_REALTIME
|
||||
#endif
|
||||
#elif defined(__APPLE__)
|
||||
#define HAVE_MACH_TIMER
|
||||
#include <mach/mach_time.h>
|
||||
#elif defined(_WIN32)
|
||||
#define WIN32_LEAN_AND_MEAN
|
||||
#include <windows.h>
|
||||
#endif
|
||||
|
||||
static uint64_t ns() {
|
||||
static uint64_t is_init = 0;
|
||||
#if defined(__APPLE__)
|
||||
static mach_timebase_info_data_t info;
|
||||
if (0 == is_init) {
|
||||
mach_timebase_info(&info);
|
||||
is_init = 1;
|
||||
}
|
||||
uint64_t now;
|
||||
now = mach_absolute_time();
|
||||
now *= info.numer;
|
||||
now /= info.denom;
|
||||
return now;
|
||||
#elif defined(__linux)
|
||||
static struct timespec linux_rate;
|
||||
if (0 == is_init) {
|
||||
clock_getres(CLOCKID, &linux_rate);
|
||||
is_init = 1;
|
||||
}
|
||||
uint64_t now;
|
||||
struct timespec spec;
|
||||
clock_gettime(CLOCKID, &spec);
|
||||
now = spec.tv_sec * 1.0e9 + spec.tv_nsec;
|
||||
return now;
|
||||
#elif defined(_WIN32)
|
||||
static LARGE_INTEGER win_frequency;
|
||||
if (0 == is_init) {
|
||||
QueryPerformanceFrequency(&win_frequency);
|
||||
is_init = 1;
|
||||
}
|
||||
LARGE_INTEGER now;
|
||||
QueryPerformanceCounter(&now);
|
||||
return (uint64_t) ((1e9 * now.QuadPart) / win_frequency.QuadPart);
|
||||
#endif
|
||||
}
|
||||
|
||||
#define STRINGIFY(x) #x
|
||||
#define TOSTRING(x) STRINGIFY(x)
|
||||
#define ERROR(...) printf("abort at line " TOSTRING(__LINE__) ": " __VA_ARGS__); printf("\n"); exit(1)
|
||||
|
||||
|
||||
// -----------------------------------------------------------------------------
|
||||
// libpng encode/decode wrappers
|
||||
// Seriously, who thought this was a good abstraction for an API to read/write
|
||||
// images?
|
||||
|
||||
typedef struct {
|
||||
int size;
|
||||
int capacity;
|
||||
unsigned char *data;
|
||||
} libpng_write_t;
|
||||
|
||||
void libpng_encode_callback(png_structp png_ptr, png_bytep data, png_size_t length) {
|
||||
libpng_write_t *write_data = (libpng_write_t*)png_get_io_ptr(png_ptr);
|
||||
if (write_data->size + length >= write_data->capacity) {
|
||||
ERROR("PNG write");
|
||||
}
|
||||
memcpy(write_data->data + write_data->size, data, length);
|
||||
write_data->size += length;
|
||||
}
|
||||
|
||||
void *libpng_encode(void *pixels, int w, int h, int *out_len) {
|
||||
png_structp png = png_create_write_struct(PNG_LIBPNG_VER_STRING, NULL, NULL, NULL);
|
||||
if (!png) {
|
||||
ERROR("png_create_write_struct");
|
||||
}
|
||||
|
||||
png_infop info = png_create_info_struct(png);
|
||||
if (!info) {
|
||||
ERROR("png_create_info_struct");
|
||||
}
|
||||
|
||||
if (setjmp(png_jmpbuf(png))) {
|
||||
ERROR("png_jmpbuf");
|
||||
}
|
||||
|
||||
// Output is 8bit depth, RGBA format.
|
||||
png_set_IHDR(
|
||||
png,
|
||||
info,
|
||||
w, h,
|
||||
8,
|
||||
PNG_COLOR_TYPE_RGBA,
|
||||
PNG_INTERLACE_NONE,
|
||||
PNG_COMPRESSION_TYPE_DEFAULT,
|
||||
PNG_FILTER_TYPE_DEFAULT
|
||||
);
|
||||
|
||||
png_bytep row_pointers[h];
|
||||
for(int y = 0; y < h; y++){
|
||||
row_pointers[y] = ((unsigned char *)pixels + y * w * 4);
|
||||
}
|
||||
|
||||
libpng_write_t write_data = {
|
||||
.size = 0,
|
||||
.capacity = w * h * 4,
|
||||
.data = malloc(w * h * 4)
|
||||
};
|
||||
|
||||
png_set_rows(png, info, row_pointers);
|
||||
png_set_write_fn(png, &write_data, libpng_encode_callback, NULL);
|
||||
png_write_png(png, info, PNG_TRANSFORM_IDENTITY, NULL);
|
||||
|
||||
png_destroy_write_struct(&png, &info);
|
||||
|
||||
*out_len = write_data.size;
|
||||
return write_data.data;
|
||||
}
|
||||
|
||||
|
||||
typedef struct {
|
||||
int pos;
|
||||
int size;
|
||||
unsigned char *data;
|
||||
} libpng_read_t;
|
||||
|
||||
void png_decode_callback(png_structp png, png_bytep data, png_size_t length) {
|
||||
libpng_read_t *read_data = (libpng_read_t*)png_get_io_ptr(png);
|
||||
if (read_data->pos + length > read_data->size) {
|
||||
ERROR("PNG read %d bytes at pos %d (size: %d)", length, read_data->pos, read_data->size);
|
||||
}
|
||||
memcpy(data, read_data->data + read_data->pos, length);
|
||||
read_data->pos += length;
|
||||
}
|
||||
|
||||
void *libpng_decode(void *data, int size, int *out_w, int *out_h) {
|
||||
png_structp png = png_create_read_struct(PNG_LIBPNG_VER_STRING, NULL, NULL, NULL);
|
||||
if (!png) {
|
||||
ERROR("png_create_read_struct");
|
||||
}
|
||||
|
||||
png_infop info = png_create_info_struct(png);
|
||||
if (!info) {
|
||||
ERROR("png_create_info_struct");
|
||||
}
|
||||
|
||||
libpng_read_t read_data = {
|
||||
.pos = 0,
|
||||
.size = size,
|
||||
.data = data
|
||||
};
|
||||
|
||||
png_set_read_fn(png, &read_data, png_decode_callback);
|
||||
png_set_sig_bytes(png, 0);
|
||||
png_read_info(png, info);
|
||||
|
||||
png_uint_32 w, h;
|
||||
int bitDepth, colorType, interlaceType;
|
||||
png_get_IHDR(png, info, &w, &h, &bitDepth, &colorType, &interlaceType, NULL, NULL);
|
||||
|
||||
// 16 bit -> 8 bit
|
||||
png_set_strip_16(png);
|
||||
|
||||
// 1, 2, 4 bit -> 8 bit
|
||||
if (bitDepth < 8) {
|
||||
png_set_packing(png);
|
||||
}
|
||||
|
||||
if (colorType & PNG_COLOR_MASK_PALETTE) {
|
||||
png_set_expand(png);
|
||||
}
|
||||
|
||||
if (!(colorType & PNG_COLOR_MASK_COLOR)) {
|
||||
png_set_gray_to_rgb(png);
|
||||
}
|
||||
|
||||
// set paletted or RGB images with transparency to full alpha so we get RGBA
|
||||
if (png_get_valid(png, info, PNG_INFO_tRNS)) {
|
||||
png_set_tRNS_to_alpha(png);
|
||||
}
|
||||
|
||||
// make sure every pixel has an alpha value
|
||||
if (!(colorType & PNG_COLOR_MASK_ALPHA)) {
|
||||
png_set_filler(png, 255, PNG_FILLER_AFTER);
|
||||
}
|
||||
|
||||
png_read_update_info(png, info);
|
||||
|
||||
unsigned char* out = malloc(w * h * 4);
|
||||
*out_w = w;
|
||||
*out_h = h;
|
||||
|
||||
// png_uint_32 rowBytes = png_get_rowbytes(png, info);
|
||||
png_bytep row_pointers[h];
|
||||
for (png_uint_32 row = 0; row < h; row++ ) {
|
||||
row_pointers[row] = (png_bytep)(out + (row * w * 4));
|
||||
}
|
||||
|
||||
png_read_image(png, row_pointers);
|
||||
png_read_end(png, info);
|
||||
png_destroy_read_struct( &png, &info, NULL);
|
||||
|
||||
return out;
|
||||
}
|
||||
|
||||
|
||||
// -----------------------------------------------------------------------------
|
||||
// stb_image encode callback
|
||||
|
||||
void stbi_write_callback(void *context, void *data, int size) {
|
||||
int *encoded_size = (int *)context;
|
||||
*encoded_size += size;
|
||||
// In theory we'd need to do another malloc(), memcpy() and free() here to
|
||||
// be fair to the other decode functions...
|
||||
}
|
||||
|
||||
|
||||
// -----------------------------------------------------------------------------
|
||||
// function to load a whole file into memory
|
||||
|
||||
void *fload(const char *path, int *out_size) {
|
||||
FILE *fh = fopen(path, "rb");
|
||||
if (!fh) {
|
||||
ERROR("Can't open file");
|
||||
}
|
||||
|
||||
fseek(fh, 0, SEEK_END);
|
||||
int size = ftell(fh);
|
||||
fseek(fh, 0, SEEK_SET);
|
||||
|
||||
void *buffer = malloc(size);
|
||||
if (!buffer) {
|
||||
ERROR("Malloc for %d bytes failed", size);
|
||||
}
|
||||
|
||||
if (!fread(buffer, size, 1, fh)) {
|
||||
ERROR("Can't read file %s", path);
|
||||
}
|
||||
fclose(fh);
|
||||
|
||||
*out_size = size;
|
||||
return buffer;
|
||||
}
|
||||
|
||||
|
||||
// -----------------------------------------------------------------------------
|
||||
// benchmark runner
|
||||
|
||||
typedef struct {
|
||||
uint64_t size;
|
||||
uint64_t encode_time;
|
||||
uint64_t decode_time;
|
||||
} benchmark_lib_result_t;
|
||||
|
||||
typedef struct {
|
||||
uint64_t px;
|
||||
int w;
|
||||
int h;
|
||||
benchmark_lib_result_t libpng;
|
||||
benchmark_lib_result_t stbi;
|
||||
benchmark_lib_result_t qoi;
|
||||
} benchmark_result_t;
|
||||
|
||||
|
||||
// Run __VA_ARGS__ a number of times and meassure the time taken. The first
|
||||
// run is ignored.
|
||||
#define BENCHMARK_FN(RUNS, AVG_TIME, ...) \
|
||||
do { \
|
||||
uint64_t time = 0; \
|
||||
for (int i = 0; i <= RUNS; i++) { \
|
||||
uint64_t time_start = ns(); \
|
||||
__VA_ARGS__ \
|
||||
uint64_t time_end = ns(); \
|
||||
if (i > 0) { \
|
||||
time += time_end - time_start; \
|
||||
} \
|
||||
} \
|
||||
AVG_TIME = time / RUNS; \
|
||||
} while (0)
|
||||
|
||||
|
||||
benchmark_result_t benchmark_image(const char *path, int runs) {
|
||||
int encoded_png_size;
|
||||
int encoded_qoi_size;
|
||||
int w;
|
||||
int h;
|
||||
|
||||
// Load the encoded PNG, encoded QOI and raw pixels into memory
|
||||
void *pixels = (void *)stbi_load(path, &w, &h, NULL, 4);
|
||||
void *encoded_png = fload(path, &encoded_png_size);
|
||||
void *encoded_qoi = qoi_encode(pixels, w, h, 4, &encoded_qoi_size);
|
||||
|
||||
if (!pixels || !encoded_qoi || !encoded_png) {
|
||||
ERROR("Error decoding %s\n", path);
|
||||
}
|
||||
|
||||
benchmark_result_t res = {0};
|
||||
res.px = w * h;
|
||||
res.w = w;
|
||||
res.h = h;
|
||||
|
||||
|
||||
// Decoding
|
||||
|
||||
BENCHMARK_FN(runs, res.libpng.decode_time, {
|
||||
int dec_w, dec_h;
|
||||
void *dec_p = libpng_decode(encoded_png, encoded_png_size, &dec_w, &dec_h);
|
||||
free(dec_p);
|
||||
});
|
||||
|
||||
BENCHMARK_FN(runs, res.stbi.decode_time, {
|
||||
int dec_w, dec_h, dec_channels;
|
||||
void *dec_p = stbi_load_from_memory(encoded_png, encoded_png_size, &dec_w, &dec_h, &dec_channels, 4);
|
||||
free(dec_p);
|
||||
});
|
||||
|
||||
BENCHMARK_FN(runs, res.qoi.decode_time, {
|
||||
int dec_w, dec_h;
|
||||
void *dec_p = qoi_decode(encoded_qoi, encoded_qoi_size, &dec_w, &dec_h, 4);
|
||||
free(dec_p);
|
||||
});
|
||||
|
||||
|
||||
// Encoding
|
||||
|
||||
BENCHMARK_FN(runs, res.libpng.encode_time, {
|
||||
int enc_size;
|
||||
void *enc_p = libpng_encode(pixels, w, h, &enc_size);
|
||||
res.libpng.size = enc_size;
|
||||
free(enc_p);
|
||||
});
|
||||
|
||||
BENCHMARK_FN(runs, res.stbi.encode_time, {
|
||||
int enc_size = 0;
|
||||
stbi_write_png_to_func(stbi_write_callback, &enc_size, w, h, 4, pixels, 0);
|
||||
res.stbi.size = enc_size;
|
||||
});
|
||||
|
||||
BENCHMARK_FN(runs, res.qoi.encode_time, {
|
||||
int enc_size;
|
||||
void *enc_p = qoi_encode(pixels, w, h, 4, &enc_size);
|
||||
res.qoi.size = enc_size;
|
||||
free(enc_p);
|
||||
});
|
||||
|
||||
free(pixels);
|
||||
free(encoded_png);
|
||||
free(encoded_qoi);
|
||||
|
||||
return res;
|
||||
}
|
||||
|
||||
void benchmark_print_result(const char *head, benchmark_result_t res) {
|
||||
double px = res.px;
|
||||
printf("## %s size: %dx%d\n", head, res.w, res.h);
|
||||
printf(" decode ms encode ms decode mpps encode mpps size kb\n");
|
||||
printf(
|
||||
"libpng: %8.1f %8.1f %8.2f %8.2f %8d\n",
|
||||
(double)res.libpng.decode_time/1000000.0,
|
||||
(double)res.libpng.encode_time/1000000.0,
|
||||
(res.libpng.decode_time > 0 ? px / ((double)res.libpng.decode_time/1000.0) : 0),
|
||||
(res.libpng.encode_time > 0 ? px / ((double)res.libpng.encode_time/1000.0) : 0),
|
||||
res.libpng.size/1024
|
||||
);
|
||||
printf(
|
||||
"stbi: %8.1f %8.1f %8.2f %8.2f %8d\n",
|
||||
(double)res.stbi.decode_time/1000000.0,
|
||||
(double)res.stbi.encode_time/1000000.0,
|
||||
(res.stbi.decode_time > 0 ? px / ((double)res.stbi.decode_time/1000.0) : 0),
|
||||
(res.stbi.encode_time > 0 ? px / ((double)res.stbi.encode_time/1000.0) : 0),
|
||||
res.stbi.size/1024
|
||||
);
|
||||
printf(
|
||||
"qoi: %8.1f %8.1f %8.2f %8.2f %8d\n",
|
||||
(double)res.qoi.decode_time/1000000.0,
|
||||
(double)res.qoi.encode_time/1000000.0,
|
||||
(res.qoi.decode_time > 0 ? px / ((double)res.qoi.decode_time/1000.0) : 0),
|
||||
(res.qoi.encode_time > 0 ? px / ((double)res.qoi.encode_time/1000.0) : 0),
|
||||
res.qoi.size/1024
|
||||
);
|
||||
printf("\n");
|
||||
}
|
||||
|
||||
int main(int argc, char **argv) {
|
||||
if (argc < 3) {
|
||||
printf("Usage: qoibench <iterations> <directory>\n");
|
||||
printf("Example: qoibench 10 images/textures/\n");
|
||||
exit(1);
|
||||
}
|
||||
|
||||
float total_percentage = 0;
|
||||
int total_size = 0;
|
||||
|
||||
benchmark_result_t totals = {0};
|
||||
|
||||
int runs = atoi(argv[1]);
|
||||
DIR *dir = opendir(argv[2]);
|
||||
if (runs <=0) {
|
||||
runs = 1;
|
||||
}
|
||||
|
||||
if (!dir) {
|
||||
ERROR("Couldn't open directory %s", argv[2]);
|
||||
}
|
||||
|
||||
printf("## Benchmarking %s/*.png -- %d runs\n\n", argv[2], runs);
|
||||
struct dirent *file;
|
||||
int i;
|
||||
for (i = 0; dir && (file = readdir(dir)) != NULL; i++) {
|
||||
if (strcmp(file->d_name + strlen(file->d_name) - 4, ".png") != 0) {
|
||||
continue;
|
||||
}
|
||||
|
||||
char *file_path = malloc(strlen(file->d_name) + strlen(argv[2])+8);
|
||||
sprintf(file_path, "%s/%s", argv[2], file->d_name);
|
||||
|
||||
benchmark_result_t res = benchmark_image(file_path, runs);
|
||||
benchmark_print_result(file_path, res);
|
||||
|
||||
free(file_path);
|
||||
|
||||
|
||||
totals.px += res.px;
|
||||
totals.libpng.encode_time += res.libpng.encode_time;
|
||||
totals.libpng.decode_time += res.libpng.decode_time;
|
||||
totals.libpng.size += res.libpng.size;
|
||||
totals.stbi.encode_time += res.stbi.encode_time;
|
||||
totals.stbi.decode_time += res.stbi.decode_time;
|
||||
totals.stbi.size += res.stbi.size;
|
||||
totals.qoi.encode_time += res.qoi.encode_time;
|
||||
totals.qoi.decode_time += res.qoi.decode_time;
|
||||
totals.qoi.size += res.qoi.size;
|
||||
}
|
||||
closedir(dir);
|
||||
|
||||
totals.px /= i;
|
||||
totals.libpng.encode_time /= i;
|
||||
totals.libpng.decode_time /= i;
|
||||
totals.libpng.size /= i;
|
||||
totals.stbi.encode_time /= i;
|
||||
totals.stbi.decode_time /= i;
|
||||
totals.stbi.size /= i;
|
||||
totals.qoi.encode_time /= i;
|
||||
totals.qoi.decode_time /= i;
|
||||
totals.qoi.size /= i;
|
||||
|
||||
benchmark_print_result("Totals (AVG)", totals);
|
||||
|
||||
return 0;
|
||||
}
|
Reference in New Issue
Block a user