gzip: speed up send_bits()
Replace one RMW op with store. This speeds up gzip of a png file by ~2%.
function old new delta
send_bits 62 66 +4
Signed-off-by: Denys Vlasenko <vda.linux@googlemail.com>
diff --git a/archival/gzip.c b/archival/gzip.c
index f253a21..08633d6 100644
--- a/archival/gzip.c
+++ b/archival/gzip.c
@@ -523,7 +523,6 @@
static void send_bits(unsigned value, unsigned length)
{
unsigned new_buf;
- unsigned remain;
#ifdef DEBUG
Tracev((stderr, " l %2d v %4x ", length, value));
@@ -534,25 +533,26 @@
new_buf = G1.bi_buf | (value << G1.bi_valid);
/* NB: the above may sometimes do "<< 32" shift (undefined)
- * if check below is changed to "length > remain" instead of >= */
- remain = BUF_SIZE - G1.bi_valid;
+ * if check below is changed to "length > BUF_SIZE" instead of >= */
+ length += G1.bi_valid;
/* If bi_buf is full */
- if (length >= remain) {
+ if (length >= BUF_SIZE) {
/* ...use (valid) bits from bi_buf and
* (BUF_SIZE - bi_valid) bits from value,
* leaving (width - (BUF_SIZE-bi_valid)) unused bits in value.
*/
+ value >>= (BUF_SIZE - G1.bi_valid);
if (BUF_SIZE == 32) {
put_32bit(new_buf); /* maybe unroll to 2*put_16bit()? */
} else { /* 16 */
put_16bit(new_buf);
}
- new_buf = value >> remain;
+ new_buf = value;
length -= BUF_SIZE;
}
G1.bi_buf = new_buf;
- G1.bi_valid += length;
+ G1.bi_valid = length;
}