X-Git-Url: https://git.sesse.net/?p=fjl;a=blobdiff_plain;f=dehuff.h;h=7621f6095e99791feb6138e81c2574ae9dda6bce;hp=9243e101530018b346e80e2db8b64b96dee1db61;hb=a4009687c73083dd0290285a065740a83e27e855;hpb=8389f95d5750d6fcb202181005954829e64865b4 diff --git a/dehuff.h b/dehuff.h index 9243e10..7621f60 100644 --- a/dehuff.h +++ b/dehuff.h @@ -81,13 +81,25 @@ static const int bit_thresholds[16] = { 0, 1 << 0, 1 << 1, 1 << 2, 1 << 3, 1 << 4, 1 << 5, 1 << 6, 1 << 7, 1 << 8, 1 << 9, 1 << 10, 1 << 11, 1 << 12, 1 << 13, 1 << 14 }; -static inline unsigned extend(int val, int bits) +static inline unsigned extend(int val, unsigned bits) { +#if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) + // GCC should ideally be able to figure out that the conditional move is better, but + // it doesn't for various reasons, and this is pretty important for speed, so we hardcode. + asm("cmp %2, %0 ; cmovl %3, %0" + : "=r" (val) + : "0" (val), + "g" (bit_thresholds[bits]), + "r" (val + (-1 << bits) + 1) + : "cc"); + return val; +#else if (val < bit_thresholds[bits]) { return val + (-1 << bits) + 1; } else { return val; } +#endif } #endif /* !defined(_DEHUFF_H) */