浏览代码

branchless float saturation

pull/4832/head
Bigfoot71 3 周前
父节点
当前提交
f305490c33
共有 1 个文件被更改,包括 26 次插入12 次删除
  1. +26
    -12
      src/external/rlsw.h

+ 26
- 12
src/external/rlsw.h 查看文件

@ -444,6 +444,27 @@ static inline void sw_vec4_transform(float dst[4], const float v[4], const sw_ma
}
}
static inline float sw_saturate(float x)
{
// After several comparisons, this saturation method
// seems to be the most optimized by GCC and Clang,
// and it does not produce any conditional branching.
// However, it is possible that a clamp could be
// more efficient on certain platforms.
// Comparisons will need to be made.
// SEE: https://godbolt.org/z/5qYznK5zj
// Saturation from below: max(0, x)
float y = 0.5f * (x + fabsf(x));
// Saturation from above: min(1, y)
return y - 0.5f * ((y - 1.0f) + fabsf(y - 1.0f));
// return (x < 0.0f) ? 0.0f : ((x > 1.0f) ? 1.0f : x);
}
static inline float sw_lerp(float a, float b, float t)
{
return a + t * (b - a);
@ -700,8 +721,7 @@ static inline void sw_map_repeat(int* out, float in, int max)
static inline void sw_map_clamp_to_edge(int* out, float in, int max)
{
in = (in > 1.0f) ? 1.0f : ((in < 0.0f) ? 0.0f : in);
*out = (int)(in * (max - 1) + 0.5f);
*out = (int)(sw_saturate(in) * (max - 1) + 0.5f);
}
static inline void sw_map_mirrored_repeat(int* out, float in, int max)
@ -991,12 +1011,9 @@ void FUNC_NAME(const sw_texture_t* tex, const sw_vertex_t* start,
\
/* Interpolate the color and modulate by the texture color */ \
for (int i = 0; i < 4; i++) { \
float lerp = start->color[i] + t * dcol[i]; \
float finalColor = texColor[i] * lerp; \
/* Inline clamp to keep the value between 0 and 1 */ \
/* NOTE: The need for clamp the colors could be a sign of problem during interpolation (?) */ \
finalColor = (finalColor < 0.0f) ? 0.0f : (finalColor > 1.0f ? 1.0f : finalColor); \
dst[i] = (uint8_t)(finalColor * 255.0f); \
float finalColor = texColor[i]; \
finalColor *= start->color[i] + t * dcol[i]; \
dst[i] = (uint8_t)(sw_saturate(finalColor) * 255.0f); \
} \
} \
else \
@ -1004,10 +1021,7 @@ void FUNC_NAME(const sw_texture_t* tex, const sw_vertex_t* start,
/* Interpolate the color */ \
for (int i = 0; i < 4; i++) { \
float finalColor = start->color[i] + t * dcol[i]; \
/* Inline clamp to keep the value between 0 and 1 */ \
/* NOTE: The need for clamp the colors could be a sign of problem during interpolation (?) */ \
finalColor = (finalColor < 0.0f) ? 0.0f : (finalColor > 1.0f ? 1.0f : finalColor); \
dst[i] = (uint8_t)(finalColor * 255.0f); \
dst[i] = (uint8_t)(sw_saturate(finalColor) * 255.0f); \
} \
} \
\

正在加载...
取消
保存