diff options
| author | Dirk Engling <erdgeist@erdgeist.org> | 2014-02-08 23:39:56 +0100 |
|---|---|---|
| committer | Dirk Engling <erdgeist@erdgeist.org> | 2014-02-08 23:39:56 +0100 |
| commit | 4affb3811c4a57cb4e033ddd40f5e99236b59250 (patch) | |
| tree | 87474b22efd29e638d79169f3ea9dd95b52591fe /src | |
| parent | a9d5ab4dbf4a7c3e2caf54c96daecc8468eacf0c (diff) | |
Speed up decompress script by avoiding to wastefully copying a megabyte of data each time we scan for a new decompression offset
Diffstat (limited to 'src')
| -rw-r--r-- | src/decompress.c | 55 |
1 files changed, 29 insertions, 26 deletions
diff --git a/src/decompress.c b/src/decompress.c index 6074db6..fbf33ec 100644 --- a/src/decompress.c +++ b/src/decompress.c | |||
| @@ -1,52 +1,55 @@ | |||
| 1 | #include <zlib.h> | 1 | #include <stdlib.h> |
| 2 | #include <stdio.h> | 2 | #include <stdio.h> |
| 3 | #include <unistd.h> | 3 | #include <unistd.h> |
| 4 | #include <fcntl.h> | 4 | #include <fcntl.h> |
| 5 | #include <string.h> | 5 | #include <string.h> |
| 6 | #include <zlib.h> | ||
| 7 | #include "mystdlib.h" | ||
| 6 | 8 | ||
| 7 | #define XORLEN (29) | 9 | #define XORLEN (29) |
| 8 | #define HUGEBLOCK (1024*1024) | 10 | #define HUGEBLOCK (1024*1024) |
| 9 | 11 | ||
| 10 | int main(int argc, char **argv) { | 12 | int main(int argc, char **argv) { |
| 11 | // int infile = open("/Volumes/DasTelefonbuch/atb/phonebook.db", O_RDONLY); | 13 | MAP in = map_file( argv[1], 1 ); |
| 12 | |||
| 13 | int infile = open( argv[1], O_RDONLY); | ||
| 14 | 14 | ||
| 15 | unsigned const char xorkey [XORLEN] = "Just for Fun. Linus Torvalds."; | 15 | unsigned const char xorkey [XORLEN] = "Just for Fun. Linus Torvalds."; |
| 16 | unsigned char input [HUGEBLOCK]; | 16 | unsigned char input [XORLEN]; |
| 17 | unsigned char output [HUGEBLOCK]; | 17 | unsigned char output [HUGEBLOCK]; |
| 18 | char respath[32]; /* file_XXXXX\0 */ | 18 | char respath[32]; /* file_XXXXX\0 */ |
| 19 | int i, offs = 0, zres = 0, filenum = 0, resfile, avail=1; | 19 | int i, zres = 0, filenum = 0, resfile; |
| 20 | z_stream z; memset( &z, 0, sizeof(z)); | 20 | size_t offs = 0; |
| 21 | 21 | ||
| 22 | while( avail ) { | 22 | z_stream z; memset( &z, 0, sizeof(z)); |
| 23 | do { | ||
| 24 | lseek( infile, offs, SEEK_SET ); | ||
| 25 | avail = read( infile, input, HUGEBLOCK ); | ||
| 26 | if( !avail) break; | ||
| 27 | for( i=0; i<XORLEN; ++i ) input[i] ^= xorkey[i]; | ||
| 28 | 23 | ||
| 29 | z.next_in = input; z.avail_in = avail; | 24 | while( offs < in->size - XORLEN ) { |
| 30 | z.next_out = output; z.avail_out = HUGEBLOCK; | 25 | for( i=0; i<XORLEN; ++i ) input[i] = in->addr[offs+i] ^ xorkey[i]; |
| 31 | inflateInit( &z ); zres = inflate( &z, Z_NO_FLUSH ); | 26 | z.next_in = input; z.avail_in = XORLEN; |
| 27 | z.next_out = output; z.avail_out = HUGEBLOCK; | ||
| 28 | inflateInit( &z ); zres = inflate( &z, Z_NO_FLUSH ); | ||
| 29 | if( (zres != Z_OK) && (zres != Z_STREAM_END) ) | ||
| 30 | goto error_continue; | ||
| 32 | 31 | ||
| 33 | if( (zres != Z_OK) && (zres != Z_STREAM_END) ) { | 32 | z.next_in = in->addr + offs + XORLEN; z.avail_in = in->size - offs - XORLEN; |
| 34 | inflateEnd(&z); memset( &z, 0, sizeof(z)); | 33 | while( zres == Z_OK ) zres = inflate( &z, Z_NO_FLUSH ); |
| 35 | offs++; | ||
| 36 | } | ||
| 37 | } while((zres != Z_OK) && (zres != Z_STREAM_END)); | ||
| 38 | 34 | ||
| 39 | if( !avail ) break; | 35 | if( zres != Z_STREAM_END ) { |
| 40 | if( zres == Z_OK) while( inflate( &z, Z_NO_FLUSH ) == Z_OK ); | 36 | error_continue: |
| 37 | inflateEnd(&z); memset( &z, 0, sizeof(z)); | ||
| 38 | offs++; | ||
| 39 | continue; | ||
| 40 | } | ||
| 41 | 41 | ||
| 42 | sprintf( respath, "file_%05X", filenum++ ); | 42 | sprintf( respath, "file_%05X", filenum++ ); |
| 43 | resfile = open( respath, O_RDWR | O_CREAT, 0644 ); | 43 | resfile = open( respath, O_RDWR | O_CREAT, 0644 ); |
| 44 | /* I know, I know, error checking */ | 44 | if( resfile < 0 ) { |
| 45 | fprintf( stderr, "Could not open output file %s\n", respath ); | ||
| 46 | exit(1); | ||
| 47 | } | ||
| 45 | write( resfile, output, z.total_out ); | 48 | write( resfile, output, z.total_out ); |
| 46 | close( resfile ); | 49 | close( resfile ); |
| 47 | offs += z.total_in; | 50 | offs += z.total_in; |
| 48 | 51 | ||
| 49 | inflateEnd(&z); memset( &z, 0, sizeof(z)); | 52 | inflateEnd(&z); memset( &z, 0, sizeof(z)); |
| 50 | } | 53 | } |
| 51 | close( infile ); | 54 | unmap_file(&in); |
| 52 | } | 55 | } |
