[Zlib-devel] [PING] Improve longest_match performance

Andreas Krebbel krebbel at linux.vnet.ibm.com
Tue May 7 05:16:57 EDT 2013


Hi,

I've verified that the attached patch helps code generation a lot with zlib 1.2.8 and GCC head (4.9).

The patch just applies a few very simple type promotions to help target platforms where some of
the zero-/sign-extension instructions are missing or slow.

Please consider the patch for inclusion in the next release. Thanks!

Bye,

-Andreas-



Index: zlib/deflate.c
===================================================================
--- zlib.orig/deflate.c 2013-05-03 13:29:35.648710587 +0200
+++ zlib/deflate.c      2013-05-03 13:29:35.678710589 +0200
@@ -1145,15 +1145,16 @@ local void lm_init (s)
 /* For 80x86 and 680x0, an optimized version will be provided in match.asm or
  * match.S. The code will be functionally equivalent.
  */
-local uInt longest_match(s, cur_match)
+local uInt longest_match(s, pcur_match)
     deflate_state *s;
-    IPos cur_match;                             /* current match */
+    IPos pcur_match;                             /* current match */
 {
+    ptrdiff_t cur_match = pcur_match; /* extend to pointer width */
     unsigned chain_length = s->max_chain_length;/* max hash chain length */
     register Bytef *scan = s->window + s->strstart; /* current string */
     register Bytef *match;                       /* matched string */
     register int len;                           /* length of current match */
-    int best_len = s->prev_length;              /* best match length so far */
+    ptrdiff_t best_len = s->prev_length;              /* best match length so far */
     int nice_match = s->nice_match;             /* stop if match long enough */
     IPos limit = s->strstart > (IPos)MAX_DIST(s) ?
         s->strstart - (IPos)MAX_DIST(s) : NIL;
@@ -1168,12 +1169,12 @@ local uInt longest_match(s, cur_match)
      * Try with and without -DUNALIGNED_OK to check.
      */
     register Bytef *strend = s->window + s->strstart + MAX_MATCH - 1;
-    register ush scan_start = *(ushf*)scan;
-    register ush scan_end   = *(ushf*)(scan+best_len-1);
+    register uInt scan_start = *(ushf*)scan;
+    register uInt scan_end   = *(ushf*)(scan+best_len-1);
 #else
     register Bytef *strend = s->window + s->strstart + MAX_MATCH;
-    register Byte scan_end1  = scan[best_len-1];
-    register Byte scan_end   = scan[best_len];
+    register uInt scan_end1  = scan[best_len-1];
+    register uInt scan_end   = scan[best_len];
 #endif

     /* The code is optimized for HASH_BITS >= 8 and MAX_MATCH-2 multiple of 16.





More information about the Zlib-devel mailing list