/* stb_resample - v0.1 - public domain image resampling no warranty implied; use at your own risk Do this: #define STB_RESAMPLE_IMPLEMENTATION before you include this file in *one* C or C++ file to create the implementation. #define STBR_ASSERT(x) to avoid using assert.h. Latest revisions: See end of file for full revision history. Initial implementation by Jorge L Rodriguez */ #ifndef STBR_INCLUDE_STB_RESAMPLE_H #define STBR_INCLUDE_STB_RESAMPLE_H // Basic usage: // result = stbr_resize(input_data, input_w, input_h, 0, output_data, output_w, output_h, 0, channels, alpha_channel, STBR_TYPE_UINT8, STBR_FILTER_BILINEAR, STBR_EDGE_CLAMP, STBR_COLORSPACE_SRGB); // // input_data is your supplied texels. // output_data will be the resized texels. It should be of size output_w * output_h * input_components (or output_h * output_stride if you provided a stride.) // If input_stride or output_stride is 0 (as in this example) the stride will be automatically calculated as width*components. // Returned result is 1 for success or 0 in case of an error. typedef enum { STBR_FILTER_NEAREST = 1, } stbr_filter; typedef enum { STBR_EDGE_CLAMP = 1, } stbr_edge; typedef enum { STBR_COLORSPACE_LINEAR = 1, STBR_COLORSPACE_SRGB = 2, } stbr_colorspace; typedef enum { STBR_TYPE_UINT8 = 1, } stbr_type; typedef unsigned char stbr_uc; typedef unsigned int stbr_size_t; // to avoid including a header for size_t #ifdef __cplusplus extern "C" { #endif #ifdef STB_RESAMPLE_STATIC #define STBRDEF static #else #define STBRDEF extern #endif ////////////////////////////////////////////////////////////////////////////// // // PRIMARY API - resize an image // STBRDEF stbr_size_t stbr_calculate_memory(int input_w, int input_h, int input_stride_in_bytes, int output_w, int output_h, int output_stride_in_bytes, int channels, stbr_filter filter); STBRDEF int stbr_resize_arbitrary(const void* input_data, int input_w, int input_h, int input_stride_in_bytes, void* output_data, int output_w, int output_h, int output_stride_in_bytes, //int channels, int alpha_channel, stbr_type type, stbr_filter filter, stbr_edge edge, stbr_colorspace colorspace, int channels, stbr_type type, stbr_filter filter, void* tempmem, stbr_size_t tempmem_size_in_bytes); #ifdef __cplusplus } #endif // // //// end header file ///////////////////////////////////////////////////// #endif // STBR_INCLUDE_STB_RESAMPLE_H #ifdef STB_RESIZE_IMPLEMENTATION #ifndef STBR_ASSERT #include #define STBR_ASSERT(x) assert(x) #endif #ifdef STBR_DEBUG #define STBR_DEBUG_ASSERT STBR_ASSERT #else #define STBR_DEBUG_ASSERT #endif // If you hit this it means I haven't done it yet. #define STBR_UNIMPLEMENTED(x) STBR_ASSERT(!(x)) #ifdef STBR_DEBUG_OVERWRITE_TEST #include #endif #include #ifndef _MSC_VER #ifdef __cplusplus #define stbr_inline inline #else #define stbr_inline #endif #else #define stbr_inline __forceinline #endif #ifdef _MSC_VER typedef unsigned short stbr__uint16; typedef signed short stbr__int16; typedef unsigned int stbr__uint32; typedef signed int stbr__int32; #else #include typedef uint16_t stbr__uint16; typedef int16_t stbr__int16; typedef uint32_t stbr__uint32; typedef int32_t stbr__int32; #endif // should produce compiler error if size is wrong typedef unsigned char stbr__validate_uint32[sizeof(stbr__uint32) == 4 ? 1 : -1]; #ifdef _MSC_VER #define STBR_NOTUSED(v) (void)(v) #else #define STBR_NOTUSED(v) (void)sizeof(v) #endif #define STBR_ARRAY_SIZE(a) (sizeof((a))/sizeof((a)[0])) // Kernel function centered at 0 typedef float (stbr__kernel_fn)(float x); typedef struct { stbr__kernel_fn* kernel; float support; } stbr__filter_info; typedef struct { int n0; // First contributing source texel int n1; // Last contributing source texel } stbr__contributors; typedef struct { const void* input_data; int input_w; int input_h; int input_stride_bytes; void* output_data; int output_w; int output_h; int output_stride_bytes; int channels; stbr_type type; stbr_filter filter; int total_coefficients; int kernel_texel_width; stbr__contributors* horizontal_contributors; float* horizontal_coefficients; stbr__contributors vertical_contributors; float* vertical_coefficients; float* decode_buffer; int ring_buffer_length; // The length of an individual entry in the ring buffer. The total number of ring buffers is kernel_texel_width int ring_buffer_first_scanline; int ring_buffer_last_scanline; int ring_buffer_begin_index; float* ring_buffer; float* encode_buffer; // A temporary buffer to store floats so we don't lose precision while we do multiply-adds. } stbr__info; float stbr__filter_nearest(float x) { if (fabs(x) <= 0.5) return 1; else return 0; } stbr__filter_info stbr__filter_info_table[] = { { NULL, 0.0f }, { stbr__filter_nearest, 0.5f }, }; // This is the maximum number of input samples that can affect an output sample // with the given filter int stbr__get_filter_texel_width(stbr_filter filter, int upsample) { STBR_UNIMPLEMENTED(!upsample); STBR_ASSERT(filter != 0); STBR_ASSERT(filter < STBR_ARRAY_SIZE(stbr__filter_info_table)); return (int)ceil(stbr__filter_info_table[filter].support * 2); } int stbr__get_total_coefficients(stbr_filter filter, int input_w, int output_w) { return output_w * stbr__get_filter_texel_width(filter, output_w > input_w ? 1 : 0); } stbr_inline static stbr__contributors* stbr__get_contributor(stbr__info* stbr_info, int n) { STBR_DEBUG_ASSERT(n >= 0 && n < stbr_info->output_w); return &stbr_info->horizontal_contributors[n]; } stbr_inline static float* stbr__get_coefficient(stbr__info* stbr_info, int n, int c) { return &stbr_info->horizontal_coefficients[stbr_info->kernel_texel_width*n + c]; } // What input texels contribute to this output texel? static void stbr__calculate_sample_range(int n, float out_filter_radius, float scale_ratio, int* in_first_texel, int* in_last_texel, float* in_center_of_out) { // What input texels contribute to this output texel? float out_texel_center = (float)n + 0.5f; float out_texel_influence_lowerbound = out_texel_center - out_filter_radius; float out_texel_influence_upperbound = out_texel_center + out_filter_radius; float in_texel_influence_lowerbound = out_texel_influence_lowerbound / scale_ratio; float in_texel_influence_upperbound = out_texel_influence_upperbound / scale_ratio; *in_center_of_out = out_texel_center / scale_ratio; *in_first_texel = (int)(floor(in_texel_influence_lowerbound + 0.5)); *in_last_texel = (int)(floor(in_texel_influence_upperbound - 0.5)); } static void stbr__calculate_coefficients(stbr__info* stbr_info, int in_first_texel, int in_last_texel, float in_center_of_out, int n, stbr__contributors* contributor, float* coefficient_group) { int i; float total_filter = 0; float filter_scale; STBR_DEBUG_ASSERT(in_last_texel - in_first_texel <= stbr_info->kernel_texel_width); STBR_DEBUG_ASSERT(in_first_texel >= 0); STBR_DEBUG_ASSERT(in_last_texel < stbr_info->input_w); contributor->n0 = in_first_texel; contributor->n1 = in_last_texel; for (i = 0; i <= in_last_texel - in_first_texel; i++) { float in_texel_center = (float)(i + in_first_texel) + 0.5f; total_filter += coefficient_group[i] = stbr__filter_info_table[stbr_info->filter].kernel(in_center_of_out - in_texel_center); } STBR_DEBUG_ASSERT(total_filter > 0); STBR_DEBUG_ASSERT(fabs(1 - total_filter) < 0.1f); // Make sure it's not way off. // Make sure the sum of all coefficients is 1. filter_scale = 1 / total_filter; for (i = 0; i <= in_last_texel - in_first_texel; i++) coefficient_group[i] *= filter_scale; } // Each scan line uses the same kernel values so we should calculate the kernel // values once and then we can use them for every scan line. static void stbr__calculate_horizontal_filters(stbr__info* stbr_info) { int n; float scale_ratio = (float)stbr_info->output_w / stbr_info->input_w; float out_pixels_radius = stbr__filter_info_table[stbr_info->filter].support * scale_ratio; STBR_UNIMPLEMENTED(stbr_info->output_w < stbr_info->input_w); for (n = 0; n < stbr_info->output_w; n++) { float in_center_of_out; // Center of the current out texel in the in texel space int in_first_texel, in_last_texel; stbr__calculate_sample_range(n, out_pixels_radius, scale_ratio, &in_first_texel, &in_last_texel, &in_center_of_out); stbr__calculate_coefficients(stbr_info, in_first_texel, in_last_texel, in_center_of_out, n, stbr__get_contributor(stbr_info, n), stbr__get_coefficient(stbr_info, n, 0)); } } static float* stbr__get_decode_buffer_index(stbr__info* stbr_info, int x, int c) { STBR_DEBUG_ASSERT(x >= 0 && x < stbr_info->input_w); STBR_DEBUG_ASSERT(c >= 0 && c < stbr_info->channels); return &stbr_info->decode_buffer[x * stbr_info->channels + c]; } static void stbr__decode_scanline(stbr__info* stbr_info, int n) { int x, c; int channels = stbr_info->channels; int input_w = stbr_info->input_w; int input_stride_bytes = stbr_info->input_stride_bytes; const void* input_data = stbr_info->input_data; float* decode_buffer = stbr_info->decode_buffer; int in_buffer_row_index = n * input_stride_bytes; STBR_UNIMPLEMENTED(stbr_info->type != STBR_TYPE_UINT8); for (x = 0; x < input_w; x++) { int texel_index = x * channels; for (c = 0; c < channels; c++) { int channel_index = x * channels + c; int in_buffer_index = in_buffer_row_index + channel_index; decode_buffer[channel_index] = ((float)((const unsigned char*)input_data)[in_buffer_index]) / 255; } } } static float* stbr__get_ring_buffer_index(float* ring_buffer, int index, int ring_buffer_length) { return &ring_buffer[index * ring_buffer_length]; } static void stbr__resample_horizontal(stbr__info* stbr_info, int n) { int x, k, c; int output_w = stbr_info->output_w; int kernel_texel_width = stbr_info->kernel_texel_width; int channels = stbr_info->channels; float* decode_buffer = stbr_info->decode_buffer; stbr__contributors* horizontal_contributors = stbr_info->horizontal_contributors; float* horizontal_coefficients = stbr_info->horizontal_coefficients; int ring_buffer_index; float* ring_buffer; if (stbr_info->ring_buffer_begin_index < 0) ring_buffer_index = stbr_info->ring_buffer_begin_index = 0; else { ring_buffer_index = (stbr_info->ring_buffer_begin_index + (stbr_info->ring_buffer_last_scanline - stbr_info->ring_buffer_first_scanline) + 1) % stbr_info->kernel_texel_width; STBR_DEBUG_ASSERT(ring_buffer_index != stbr_info->ring_buffer_begin_index); } ring_buffer = stbr__get_ring_buffer_index(stbr_info->ring_buffer, ring_buffer_index, stbr_info->ring_buffer_length); memset(ring_buffer, 0, stbr_info->ring_buffer_length); for (x = 0; x < output_w; x++) { int n0 = horizontal_contributors[x].n0; int n1 = horizontal_contributors[x].n1; int out_texel_index = x * channels; int coefficient_group_index = x * kernel_texel_width; int coefficient_counter = 0; STBR_DEBUG_ASSERT(n1 >= n0); for (k = n0; k <= n1; k++) { int coefficient_index = coefficient_group_index + (coefficient_counter++); int in_texel_index = k * channels; float coefficient = horizontal_coefficients[coefficient_index]; if (!coefficient) continue; for (c = 0; c < channels; c++) ring_buffer[out_texel_index + c] += decode_buffer[in_texel_index + c] * coefficient; } } stbr_info->ring_buffer_last_scanline = n; } static void stbr__decode_and_resample(stbr__info* stbr_info, int n) { if (n >= stbr_info->input_h) { STBR_UNIMPLEMENTED("ring buffer overran source height"); return; } // Decode the nth scanline from the source image into the decode buffer. stbr__decode_scanline(stbr_info, n); // Now resample it into the ring buffer. stbr__resample_horizontal(stbr_info, n); // Now it's sitting in the ring buffer ready to be used as source for the vertical sampling. } // Get the specified scan line from the ring buffer. static float* stbr__get_ring_buffer_scanline(int get_scanline, float* ring_buffer, int begin_index, int first_scanline, int ring_buffer_size, int ring_buffer_length) { int ring_buffer_index = (begin_index + (get_scanline - first_scanline)) % ring_buffer_size; return stbr__get_ring_buffer_index(ring_buffer, ring_buffer_index, ring_buffer_length); } static void stbr__resample_vertical(stbr__info* stbr_info, int n, int in_first_scanline, int in_last_scanline, float in_center_of_out) { int x, k, c; int output_w = stbr_info->output_w; stbr__contributors* vertical_contributors = &stbr_info->vertical_contributors; float* vertical_coefficients = stbr_info->vertical_coefficients; int channels = stbr_info->channels; int kernel_texel_width = stbr_info->kernel_texel_width; void* output_data = stbr_info->output_data; float* encode_buffer = stbr_info->encode_buffer; float* ring_buffer = stbr_info->ring_buffer; int ring_buffer_begin_index = stbr_info->ring_buffer_begin_index; int ring_buffer_first_scanline = stbr_info->ring_buffer_first_scanline; int ring_buffer_last_scanline = stbr_info->ring_buffer_last_scanline; int ring_buffer_length = stbr_info->ring_buffer_length; STBR_UNIMPLEMENTED(stbr_info->type != STBR_TYPE_UINT8); stbr__calculate_coefficients(stbr_info, in_first_scanline, in_last_scanline, in_center_of_out, n, vertical_contributors, vertical_coefficients); int n0 = vertical_contributors->n0; int n1 = vertical_contributors->n1; int output_row_index = n * stbr_info->output_stride_bytes; STBR_DEBUG_ASSERT(n0 >= in_first_scanline); STBR_DEBUG_ASSERT(n1 <= in_last_scanline); for (x = 0; x < output_w; x++) { int in_texel_index = x * channels; int out_texel_index = output_row_index + x * channels; int coefficient_counter = 0; STBR_DEBUG_ASSERT(n1 >= n0); memset(encode_buffer, 0, sizeof(float) * channels); for (k = n0; k <= n1; k++) { int coefficient_index = coefficient_counter++; float* ring_buffer_entry = stbr__get_ring_buffer_scanline(k, ring_buffer, ring_buffer_begin_index, ring_buffer_first_scanline, kernel_texel_width, ring_buffer_length); float coefficient = vertical_coefficients[coefficient_index]; if (!coefficient) continue; for (c = 0; c < channels; c++) encode_buffer[c] += ring_buffer_entry[in_texel_index + c] * coefficient; } for (c = 0; c < channels; c++) ((unsigned char*)output_data)[out_texel_index + c] = (unsigned char)(encode_buffer[c] * 255); } } STBRDEF int stbr_resize_arbitrary(const void* input_data, int input_w, int input_h, int input_stride_in_bytes, void* output_data, int output_w, int output_h, int output_stride_in_bytes, int channels, stbr_type type, stbr_filter filter, void* tempmem, stbr_size_t tempmem_size_in_bytes) { int y; int width_stride_input = input_stride_in_bytes ? input_stride_in_bytes : channels * input_w; int width_stride_output = output_stride_in_bytes ? output_stride_in_bytes : channels * output_w; #ifdef STBR_DEBUG_OVERWRITE_TEST #define OVERWRITE_ARRAY_SIZE 64 unsigned char overwrite_output_pre[OVERWRITE_ARRAY_SIZE]; unsigned char overwrite_tempmem_pre[OVERWRITE_ARRAY_SIZE]; stbr_size_t begin_forbidden = width_stride_output * (output_h - 1) + output_w * channels; memcpy(overwrite_output_pre, &((unsigned char*)output_data)[begin_forbidden], OVERWRITE_ARRAY_SIZE); memcpy(overwrite_tempmem_pre, &((unsigned char*)tempmem)[tempmem_size_in_bytes], OVERWRITE_ARRAY_SIZE); #endif STBR_UNIMPLEMENTED(type != STBR_TYPE_UINT8); STBR_ASSERT(filter != 0); STBR_ASSERT(filter < STBR_ARRAY_SIZE(stbr__filter_info_table)); if (!tempmem) return 0; if (tempmem_size_in_bytes < stbr_calculate_memory(input_w, input_h, input_stride_in_bytes, output_w, output_h, output_stride_in_bytes, channels, STBR_FILTER_NEAREST)) return 0; memset(tempmem, 0, tempmem_size_in_bytes); stbr__info* stbr_info = (stbr__info*)tempmem; stbr_info->input_data = input_data; stbr_info->input_w = input_w; stbr_info->input_h = input_h; stbr_info->input_stride_bytes = width_stride_input; stbr_info->output_data = output_data; stbr_info->output_w = output_w; stbr_info->output_h = output_h; stbr_info->output_stride_bytes = width_stride_output; stbr_info->channels = channels; stbr_info->type = type; stbr_info->filter = filter; stbr_info->total_coefficients = stbr__get_total_coefficients(filter, input_w, output_w); stbr_info->kernel_texel_width = stbr__get_filter_texel_width(filter, output_w > input_w ? 1 : 0); stbr_info->ring_buffer_length = output_w * channels * sizeof(float); #define STBR__NEXT_MEMPTR(current, old, newtype) (newtype*)(((unsigned char*)current) + old) stbr_info->horizontal_contributors = STBR__NEXT_MEMPTR(stbr_info, sizeof(stbr__info), stbr__contributors); stbr_info->horizontal_coefficients = STBR__NEXT_MEMPTR(stbr_info->horizontal_contributors, output_w * sizeof(stbr__contributors), float); stbr_info->vertical_coefficients = STBR__NEXT_MEMPTR(stbr_info->horizontal_coefficients, stbr_info->total_coefficients * sizeof(float), float); stbr_info->decode_buffer = STBR__NEXT_MEMPTR(stbr_info->vertical_coefficients, stbr_info->kernel_texel_width * sizeof(float), float); stbr_info->ring_buffer = STBR__NEXT_MEMPTR(stbr_info->decode_buffer, input_w * channels * sizeof(float), float); stbr_info->encode_buffer = STBR__NEXT_MEMPTR(stbr_info->ring_buffer, output_w * channels * sizeof(float) * stbr_info->kernel_texel_width, float); #undef STBR__NEXT_MEMPTR // This signals that the ring buffer is empty stbr_info->ring_buffer_begin_index = -1; stbr__calculate_horizontal_filters(stbr_info); float scale_ratio = (float)output_h / input_h; float out_scanlines_radius = stbr__filter_info_table[filter].support * scale_ratio; for (y = 0; y < output_h; y++) { float in_center_of_out; // Center of the current out scanline in the in scanline space int in_first_scanline, in_last_scanline; stbr__calculate_sample_range(y, out_scanlines_radius, scale_ratio, &in_first_scanline, &in_last_scanline, &in_center_of_out); STBR_DEBUG_ASSERT(in_last_scanline - in_first_scanline <= stbr_info->kernel_texel_width); STBR_DEBUG_ASSERT(in_first_scanline >= 0); STBR_DEBUG_ASSERT(in_last_scanline < input_w); if (stbr_info->ring_buffer_begin_index >= 0) { // Get rid of whatever we don't need anymore. while (in_first_scanline > stbr_info->ring_buffer_first_scanline) { if (stbr_info->ring_buffer_first_scanline == stbr_info->ring_buffer_last_scanline) { // We just popped the last scanline off the ring buffer. // Reset it to the empty state. stbr_info->ring_buffer_begin_index = -1; stbr_info->ring_buffer_first_scanline = 0; stbr_info->ring_buffer_last_scanline = 0; break; } else stbr_info->ring_buffer_first_scanline++; } } // Load in new ones. if (stbr_info->ring_buffer_begin_index < 0) stbr__decode_and_resample(stbr_info, in_first_scanline); while (in_last_scanline < stbr_info->ring_buffer_last_scanline) stbr__decode_and_resample(stbr_info, stbr_info->ring_buffer_last_scanline + 1); // Now all buffers should be ready to do a row a vertical sampling. stbr__resample_vertical(stbr_info, y, in_first_scanline, in_last_scanline, in_center_of_out); } #ifdef STBR_DEBUG_OVERWRITE_TEST STBR_DEBUG_ASSERT(memcmp(overwrite_output_pre, &((unsigned char*)output_data)[begin_forbidden], OVERWRITE_ARRAY_SIZE) == 0); STBR_DEBUG_ASSERT(memcmp(overwrite_tempmem_pre, &((unsigned char*)tempmem)[tempmem_size_in_bytes], OVERWRITE_ARRAY_SIZE) == 0); #endif return 1; } STBRDEF stbr_size_t stbr_calculate_memory(int input_w, int input_h, int input_stride_in_bytes, int output_w, int output_h, int output_stride_in_bytes, int channels, stbr_filter filter) { STBR_ASSERT(filter != 0); STBR_ASSERT(filter < STBR_ARRAY_SIZE(stbr__filter_info_table)); int info_size = sizeof(stbr__info); int decode_buffer_size = input_w * channels * sizeof(float); int contributors_size = output_w * sizeof(stbr__contributors); int horizontal_coefficients_size = stbr__get_total_coefficients(filter, input_w, output_w) * sizeof(float); int vertical_coefficients_size = stbr__get_filter_texel_width(filter, output_w > input_w ? 1 : 0) * sizeof(float); int ring_buffer_size = output_w * channels * sizeof(float) * stbr__get_filter_texel_width(filter, output_w > input_w ? 1 : 0); int encode_buffer_size = channels * sizeof(float); return info_size + decode_buffer_size + contributors_size + horizontal_coefficients_size + vertical_coefficients_size + ring_buffer_size + encode_buffer_size; } #endif // STB_RESAMPLE_IMPLEMENTATION /* revision history: */