diff options
author | sewardj <sewardj@a5019735-40e9-0310-863c-91ae7b9d1cf9> | 2011-05-11 16:04:28 +0000 |
---|---|---|
committer | sewardj <sewardj@a5019735-40e9-0310-863c-91ae7b9d1cf9> | 2011-05-11 16:04:28 +0000 |
commit | d2f95a0c23802cc6694a618bddd314391473f23c (patch) | |
tree | 036eb5fd072845dad833b2b21c66be68a8c51303 /exp-sgcheck/tests | |
parent | 889a6aede01eec00a2c523fc9a12f288082d0dae (diff) |
Rename 'exp-ptrcheck' to 'exp-sgcheck' and hope this does not cause
too much build carnage.
git-svn-id: svn://svn.valgrind.org/valgrind/trunk@11745 a5019735-40e9-0310-863c-91ae7b9d1cf9
Diffstat (limited to 'exp-sgcheck/tests')
138 files changed, 11075 insertions, 0 deletions
diff --git a/exp-sgcheck/tests/Makefile.am b/exp-sgcheck/tests/Makefile.am new file mode 100644 index 00000000..cc2bc3af --- /dev/null +++ b/exp-sgcheck/tests/Makefile.am @@ -0,0 +1,134 @@ + +include $(top_srcdir)/Makefile.tool-tests.am + +dist_noinst_SCRIPTS = filter_stderr filter_add filter_suppgen \ + sh_script + +EXTRA_DIST = \ + is_arch_supported \ + add.vgtest-disabled add.stderr.exp \ + and.vgtest-disabled and.stderr.exp \ + arith.vgtest-disabled arith.stderr.exp \ + arith_include1.c arith_include2.c \ + bad_percentify.vgtest bad_percentify.c \ + bad_percentify.stdout.exp bad_percentify.stderr.exp-glibc28-amd64 \ + base.vgtest \ + base.stderr.exp-glibc25-amd64 base.stderr.exp-glibc25-x86 \ + ccc.vgtest ccc.stderr.exp-glibc25-amd64 \ + ccc.stderr.exp-glibc27-x86 ccc.stderr.exp-glibc28-amd64 \ + cmp.vgtest-disabled cmp.stderr.exp \ + globalerr.vgtest globalerr.stdout.exp \ + globalerr.stderr.exp-glibc28-amd64 \ + fp.vgtest fp.stderr.exp \ + hackedbz2.vgtest hackedbz2.stdout.exp \ + hackedbz2.stderr.exp-glibc28-amd64 \ + hp_bounds.vgtest hp_bounds.stderr.exp \ + hp_dangle.vgtest hp_dangle.stderr.exp \ + hsg.vgtest hsg.stdout.exp hsg.stderr.exp \ + idiv.vgtest-disabled idiv.stderr.exp \ + imul.vgtest-disabled imul.stderr.exp \ + justify.vgtest justify.stderr.exp \ + mm.vgtest-disabled mm.stderr.exp \ + neg.vgtest-disabled neg.stderr.exp \ + not.vgtest-disabled not.stderr.exp \ + or.vgtest-disabled or.stderr.exp \ + partial_bad.vgtest \ + partial_bad.stderr.exp-glibc25-x86 \ + partial_bad.stderr.exp-glibc25-amd64 \ + partial_good.vgtest \ + partial_good.stderr.exp-glibc25-x86 \ + partial_good.stderr.exp-glibc25-amd64 \ + preen_invars.vgtest preen_invars.stdout.exp \ + preen_invars.stderr.exp-glibc28-amd64 \ + pth_create.vgtest pth_create.stderr.exp \ + pth_specific.vgtest pth_specific.stderr.exp \ + realloc.vgtest \ + realloc.stderr.exp-glibc25-x86 realloc.stderr.exp-glibc25-amd64 \ + sh_script.vgtest-disabled sh_script.stderr.exp \ + stackerr.vgtest stackerr.stdout.exp \ + stackerr.stderr.exp-glibc28-amd64 stackerr.stderr.exp-glibc27-x86 \ + strcpy.vgtest strcpy.stderr.exp \ + strlen_bad.vgtest-disabled strlen_bad.stderr.exp \ + strlen_good.vgtest-disabled strlen_good.stderr.exp \ + sub.vgtest-disabled sub.stderr.exp \ + supp.vgtest supp.stderr.exp supp.supp \ + suppgen.vgtest-disabled suppgen.stderr.exp suppgen.stdin \ + syscall.vgtest-disabled syscall.stderr.exp \ + tricky.vgtest tricky.stderr.exp \ + unaligned.vgtest \ + unaligned.stderr.exp-glibc25-x86 unaligned.stderr.exp-glibc25-amd64 \ + xor.vgtest-disabled xor.stderr.exp \ + zero.vgtest zero.stderr.exp + +check_PROGRAMS = \ + add and arith bad_percentify base cmp fp \ + globalerr hackedbz2 \ + hp_bounds hp_dangle hsg idiv imul \ + justify mm not neg or partial \ + preen_invars preen_invars_so.so \ + pth_create pth_specific realloc \ + stackerr \ + strcpy strlen sub supp syscall tricky unaligned xor zero + +# DDD: not sure if these ones should work on Darwin or not... if not, should +# be moved into x86-linux/. +if ! VGCONF_OS_IS_DARWIN + check_PROGRAMS += \ + ccc +endif + + +AM_CFLAGS += $(AM_FLAG_M3264_PRI) +AM_CXXFLAGS += $(AM_FLAG_M3264_PRI) + +# To make it a bit more realistic, build hackedbz2.c with at +# least some optimisation. +hackedbz2_CFLAGS = $(AM_CFLAGS) -O -Wno-inline + +# C ones +pth_create_LDADD = -lpthread +pth_specific_LDADD = -lpthread + +# C++ ones +ccc_SOURCES = ccc.cpp + +# Build shared object for preen_invars +preen_invars_DEPENDENCIES = preen_invars_so.so +if VGCONF_PLATFORMS_INCLUDE_PPC64_AIX5 + preen_invars_LDADD = -ldl + preen_invars_LDFLAGS = $(AM_FLAG_M3264_PRI) +else +if VGCONF_PLATFORMS_INCLUDE_PPC32_AIX5 + preen_invars_LDADD = -ldl + preen_invars_LDFLAGS = $(AM_FLAG_M3264_PRI) -Wl,-G -Wl,-bnogc +else +if VGCONF_OS_IS_DARWIN + preen_invars_LDADD = -ldl + preen_invars_LDFLAGS = $(AM_FLAG_M3264_PRI) +else + preen_invars_LDADD = -ldl + preen_invars_LDFLAGS = $(AM_FLAG_M3264_PRI) \ + -Wl,-rpath,$(top_builddir)/memcheck/tests +endif +endif +endif + +preen_invars_so_so_SOURCES = preen_invars_so.c # For automake-1.7. +preen_invars_so_so_CFLAGS = $(AM_CFLAGS) -fpic +if VGCONF_PLATFORMS_INCLUDE_PPC64_AIX5 + preen_invars_so_so_LDFLAGS = -fpic $(AM_FLAG_M3264_PRI) -shared +else +if VGCONF_PLATFORMS_INCLUDE_PPC32_AIX5 + preen_invars_so_so_LDFLAGS = -fpic $(AM_FLAG_M3264_PRI) -shared \ + -Wl,-G -Wl,-bnogc +else +if VGCONF_OS_IS_DARWIN + preen_invars_so_so_LDFLAGS = -fpic $(AM_FLAG_M3264_PRI) -dynamic \ + -dynamiclib -all_load +else + preen_invars_so_so_LDFLAGS = -fpic $(AM_FLAG_M3264_PRI) -shared \ + -Wl,-soname -Wl,preen_invars_so.so +endif +endif +endif + diff --git a/exp-sgcheck/tests/add.c b/exp-sgcheck/tests/add.c new file mode 100644 index 00000000..f861a628 --- /dev/null +++ b/exp-sgcheck/tests/add.c @@ -0,0 +1,40 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // ADD ========================================================= + g(+, n, n, n); // det, det + + g(+, n, p, p); // ok, det + + g(+, p, n, p); // ok, det + + g(+, p, p, e); // detected bad add; det, det + + g(+, n, un, u); // undet, undet + g(+, n, up, u); // ok, undet + + g(+, un, n, u); // undet, undet + g(+, up, n, u); // ok, undet + + g(+, un, un, u); // undet, undet + g(+, un, up, u); // undet, undet + g(+, up, un, u); // undet, undet + g(+, up, up, u); // undetected bad add; undet, undet + + g(+, un, p, u); // undet, undet + g(+, up, p, u); // undetected bad add; undet, undet + + g(+, p, un, u); // undet, undet + g(+, p, up, u); // undetected bad add; undet, undet + + return 0; +} diff --git a/exp-sgcheck/tests/add.stderr.exp b/exp-sgcheck/tests/add.stderr.exp new file mode 100644 index 00000000..e4e0f11f --- /dev/null +++ b/exp-sgcheck/tests/add.stderr.exp @@ -0,0 +1,70 @@ + +about to do 14 [0] +Invalid read of size 4 + at 0x........: main (add.c:14) + Address 0x........ is not derived from any known block +about to do 14 [-1] + +Invalid read of size 4 + at 0x........: main (add.c:14) + Address 0x........ is not derived from any known block +about to do 16 [0] +about to do 16 [-1] + +Invalid read of size 4 + at 0x........: main (add.c:16) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 18 [0] +about to do 18 [-1] + +Invalid read of size 4 + at 0x........: main (add.c:18) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + +Invalid arguments to Add32/Add64 + at 0x........: main (add.c:20) + Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 20 [0] + +Invalid read of size 4 + at 0x........: main (add.c:20) + Address 0x........ is not derived from any known block +about to do 20 [-1] + +Invalid read of size 4 + at 0x........: main (add.c:20) + Address 0x........ is not derived from any known block +about to do 22 [0] +about to do 22 [-1] +about to do 23 [0] +about to do 23 [-1] +about to do 25 [0] +about to do 25 [-1] +about to do 26 [0] +about to do 26 [-1] +about to do 28 [0] +about to do 28 [-1] +about to do 29 [0] +about to do 29 [-1] +about to do 30 [0] +about to do 30 [-1] +about to do 31 [0] +about to do 31 [-1] +about to do 33 [0] +about to do 33 [-1] +about to do 34 [0] +about to do 34 [-1] +about to do 36 [0] +about to do 36 [-1] +about to do 37 [0] +about to do 37 [-1] + +ERROR SUMMARY: 7 errors from 7 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/add.vgtest-disabled b/exp-sgcheck/tests/add.vgtest-disabled new file mode 100644 index 00000000..1fb7c795 --- /dev/null +++ b/exp-sgcheck/tests/add.vgtest-disabled @@ -0,0 +1,2 @@ +prog: add +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/and.c b/exp-sgcheck/tests/and.c new file mode 100644 index 00000000..09a1ef51 --- /dev/null +++ b/exp-sgcheck/tests/and.c @@ -0,0 +1,49 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // Not testing the n&p-->p type cases, too hard to find an 'n' that gives + // something that looks like a pointer! (Eg. if the pointer is + // 0x40c38000, masking to 0x40000000 won't give invalid memory, and + // masking below that, eg. to 0x00c38000 doesn't give a pointer result.) + + // AND ========================================================= + g(&, n, n, n); // det, det + + g(&, n, p, n); // det, det + g(&, nFF,p, n); // ok, det + + g(&, p, n, n); // det, det + g(&, p, nFF,n); // ok, det + + g(&, p, p, p); // ok, det + g(&, p, p2, e); // bad AND detected; det, det + + g(&, n, un, n); // det, det + g(&, n, up, n); // det, det + + g(&, un, n, n); // det, det + g(&, up, n, n); // det, det + + g(&, un, un, u); // undet, undet + g(&, un, up, n); // det, det + g(&, up, un, n); // det, det + g(&, up, up, u); // ok, undet + g(&, up, up2,u); // undet, undet + + g(&, un, p, n); // det, det + g(&, up, p, n); // det, det (result doesn't look like a pointer) + + g(&, p, un, n); // det, det + g(&, p, up, u); // det, det + + return 0; +} diff --git a/exp-sgcheck/tests/and.stderr.exp b/exp-sgcheck/tests/and.stderr.exp new file mode 100644 index 00000000..9ef37301 --- /dev/null +++ b/exp-sgcheck/tests/and.stderr.exp @@ -0,0 +1,184 @@ + +about to do 19 [0] +Invalid read of size 4 + at 0x........: main (and.c:19) + Address 0x........ is not derived from any known block +about to do 19 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:19) + Address 0x........ is not derived from any known block +about to do 21 [0] + +Invalid read of size 4 + at 0x........: main (and.c:21) + Address 0x........ is not derived from any known block +about to do 21 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:21) + Address 0x........ is not derived from any known block +about to do 22 [0] +about to do 22 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:22) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 24 [0] + +Invalid read of size 4 + at 0x........: main (and.c:24) + Address 0x........ is not derived from any known block +about to do 24 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:24) + Address 0x........ is not derived from any known block +about to do 25 [0] +about to do 25 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:25) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 27 [0] +about to do 27 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:27) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + +Invalid arguments to And32/And64 + at 0x........: main (and.c:28) + First arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 28 [0] + +Invalid read of size 4 + at 0x........: main (and.c:28) + Address 0x........ is not derived from any known block +about to do 28 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:28) + Address 0x........ is not derived from any known block +about to do 30 [0] + +Invalid read of size 4 + at 0x........: main (and.c:30) + Address 0x........ is not derived from any known block +about to do 30 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:30) + Address 0x........ is not derived from any known block +about to do 31 [0] + +Invalid read of size 4 + at 0x........: main (and.c:31) + Address 0x........ is not derived from any known block +about to do 31 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:31) + Address 0x........ is not derived from any known block +about to do 33 [0] + +Invalid read of size 4 + at 0x........: main (and.c:33) + Address 0x........ is not derived from any known block +about to do 33 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:33) + Address 0x........ is not derived from any known block +about to do 34 [0] + +Invalid read of size 4 + at 0x........: main (and.c:34) + Address 0x........ is not derived from any known block +about to do 34 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:34) + Address 0x........ is not derived from any known block +about to do 36 [0] +about to do 36 [-1] +about to do 37 [0] + +Invalid read of size 4 + at 0x........: main (and.c:37) + Address 0x........ is not derived from any known block +about to do 37 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:37) + Address 0x........ is not derived from any known block +about to do 38 [0] + +Invalid read of size 4 + at 0x........: main (and.c:38) + Address 0x........ is not derived from any known block +about to do 38 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:38) + Address 0x........ is not derived from any known block +about to do 39 [0] +about to do 39 [-1] +about to do 40 [0] +about to do 40 [-1] +about to do 42 [0] + +Invalid read of size 4 + at 0x........: main (and.c:42) + Address 0x........ is not derived from any known block +about to do 42 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:42) + Address 0x........ is not derived from any known block +about to do 43 [0] + +Invalid read of size 4 + at 0x........: main (and.c:43) + Address 0x........ is not derived from any known block +about to do 43 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:43) + Address 0x........ is not derived from any known block +about to do 45 [0] + +Invalid read of size 4 + at 0x........: main (and.c:45) + Address 0x........ is not derived from any known block +about to do 45 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:45) + Address 0x........ is not derived from any known block +about to do 46 [0] + +Invalid read of size 4 + at 0x........: main (and.c:46) + Address 0x........ is not derived from any known block +about to do 46 [-1] + +Invalid read of size 4 + at 0x........: main (and.c:46) + Address 0x........ is not derived from any known block + +ERROR SUMMARY: 32 errors from 32 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/and.vgtest-disabled b/exp-sgcheck/tests/and.vgtest-disabled new file mode 100644 index 00000000..2a276120 --- /dev/null +++ b/exp-sgcheck/tests/and.vgtest-disabled @@ -0,0 +1,2 @@ +prog: and +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/arith.c b/exp-sgcheck/tests/arith.c new file mode 100644 index 00000000..32af88c9 --- /dev/null +++ b/exp-sgcheck/tests/arith.c @@ -0,0 +1,57 @@ + +#include <stdlib.h> + +typedef unsigned long Ulong; + +int main(void) +{ + long* x = malloc(sizeof(long) * 10); + long* y = malloc(sizeof(long) * 10); + long* y2 = y + 3; + + // ok -- same segment + long w = y2 - y; + + // ok -- different heap segments (result can only be used to index off + // 'x', but glibc's strcpy() does this...) + long* z = (long*)((long)x - (long)y); + + w = (long)y2 + (long)y; // bad (same segment) + + w = (long)x & (long)y; // bad (different segments) + + w = (long)y2 / (long)4; // bad, but indistinguishable from + // acceptable '%' cases... + + w = (long)y2 % (long)4; // ok + w = (long)y2 % (long)y; // bad -- modulor(?) is a pointer + w = (long)0xffffffff % (long)y; // bad -- modulend(?) is a non-pointer + + w = (Ulong)y2 % (Ulong)4; // ok + w = (Ulong)y2 % (Ulong)y; // bad -- modulor(?) is a pointer + w = (Ulong)0xffffffff % (Ulong)y; // bad -- modulend(?) is a non-pointer + + w = (long)y * (long)y2; // bad + + w = (long)y >> (long)2; // ok + w = (long)y << (long)2; // ok + + w = (long)y & 0xffff; // ok + w = (long)y | 0xffff; // ok + w = (long)y ^ (long)y2; // ok + + w = ~((long)y); // ok + + w = -((long)y); // bad -- operand is a non-polonger + + w = (long)x ^ (long)x; // xor(ptr,ptr) --> constant (0) + z = x + w; // ok, because xor result was zero + + w = (long)x ^ ((long)x+1); // xor(ptr,ptr') --> constant (small) + z = x + w; // ok, because xor result was constant + + w = (long)x ^ (long)y; // xor(ptr,ptr') --> constant (small) + z = x + w; // ok, because xor result was constant + + return (long)z; +} diff --git a/exp-sgcheck/tests/arith.stderr.exp b/exp-sgcheck/tests/arith.stderr.exp new file mode 100644 index 00000000..4af05c54 --- /dev/null +++ b/exp-sgcheck/tests/arith.stderr.exp @@ -0,0 +1,79 @@ + +Invalid ADD + at 0x........: main (arith.c:19) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:9) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Invalid AND + at 0x........: main (arith.c:21) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:9) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:8) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Invalid IDIV + at 0x........: main (arith.c:27) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:9) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Invalid IDIV + at 0x........: main (arith.c:28) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First arg not a pointer +Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:9) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Invalid DIV + at 0x........: main (arith.c:31) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:9) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Invalid DIV + at 0x........: main (arith.c:32) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First arg not a pointer +Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:9) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Invalid IMUL + at 0x........: main (arith.c:34) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith.c:9) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +ERROR SUMMARY: 7 errors from 7 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/arith.vgtest-disabled b/exp-sgcheck/tests/arith.vgtest-disabled new file mode 100644 index 00000000..5a6f6076 --- /dev/null +++ b/exp-sgcheck/tests/arith.vgtest-disabled @@ -0,0 +1 @@ +prog: arith diff --git a/exp-sgcheck/tests/arith_include1.c b/exp-sgcheck/tests/arith_include1.c new file mode 100644 index 00000000..dfbbe6b9 --- /dev/null +++ b/exp-sgcheck/tests/arith_include1.c @@ -0,0 +1,17 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> +#include <string.h> + +static jmp_buf TTT_jmpbuf; + +void SEGV_handler(int signum) +{ + //fprintf(stderr, "segv caught\n"); + __builtin_longjmp(TTT_jmpbuf, 1); +} + +int up[10], up2[10]; + diff --git a/exp-sgcheck/tests/arith_include2.c b/exp-sgcheck/tests/arith_include2.c new file mode 100644 index 00000000..524ca997 --- /dev/null +++ b/exp-sgcheck/tests/arith_include2.c @@ -0,0 +1,41 @@ + + // Comment "both" means tp[0] and tp[-1] are both bad. + // Otherwise only tp[-1] is bad. + + #define TTT \ + if (__builtin_setjmp(TTT_jmpbuf) == 0) \ + { fprintf(stderr, "about to do %d [0]\n", __LINE__); tn = tp[ 0]; } \ + if (__builtin_setjmp(TTT_jmpbuf) == 0) \ + { fprintf(stderr, "about to do %d [-1]\n", __LINE__); tn = tp[-1]; } + + #define b( a, c) tp = (long*)a; TTT + #define ui(op, a, c) tp = (long*)op(long)a; TTT + #define g(op, a,b,c) tp = (long*)((long)a op (long)b); TTT + #define UNU __attribute__((unused)) + + struct sigaction sigsegv; + // Scratch values + long a, tn __attribute__((unused)); + long* tp; + + // Known pointers + long* p = malloc(sizeof(long)*10); UNU long* p2 = malloc(sizeof(long)*10); + UNU long* pp = p; + // Unknown pointers +// long up[10], UNU up2[10]; + + // Known nonptrs; make them zero and known + long n = a ^ a, UNU n2 = n+1, UNU n7F = 0x7fffffffUL, UNU nFF = ~n; + + // Unknown nonptrs; make them zero but unknown + long un = 0x01100000UL, UNU un2 = un; + + // Known nonptr, from pointerness range check + UNU long nn = 0; + + // Intall SEGV handler + memset(&sigsegv, 0, sizeof(sigsegv)); + sigsegv.sa_handler = SEGV_handler; + sigsegv.sa_flags = SA_NODEFER; /* so we can handle signal many times */ + assert( 0 == sigemptyset( &sigsegv.sa_mask ) ); + assert( 0 == sigaction(SIGSEGV, &sigsegv, NULL) ); diff --git a/exp-sgcheck/tests/bad_percentify.c b/exp-sgcheck/tests/bad_percentify.c new file mode 100644 index 00000000..2567742c --- /dev/null +++ b/exp-sgcheck/tests/bad_percentify.c @@ -0,0 +1,109 @@ + +/* This demonstrates a stack overrun bug that exp-ptrcheck found while + running Valgrind itself (self hosting). As at 12 Sept 08 this bug + is still in Valgrind. */ + +#include <stdio.h> +#include <stdlib.h> +#include <assert.h> +#include <string.h> + +typedef unsigned long long int ULong; +typedef unsigned int UInt; +typedef signed int Int; +typedef char Char; + +/* --------------------------------------------------------------------- + percentify() + ------------------------------------------------------------------ */ + +/* This part excerpted from coregrind/m_libcbase.c */ + +// Percentify n/m with d decimal places. Includes the '%' symbol at the end. +// Right justifies in 'buf'. +void VG_percentify(ULong n, ULong m, UInt d, Int n_buf, char buf[]) +{ + Int i, len, space; + ULong p1; + Char fmt[32]; + + if (m == 0) { + // Have to generate the format string in order to be flexible about + // the width of the field. + sprintf(fmt, "%%-%ds", n_buf); + // fmt is now "%<n_buf>s" where <d> is 1,2,3... + sprintf(buf, fmt, "--%"); + return; + } + + p1 = (100*n) / m; + + if (d == 0) { + sprintf(buf, "%lld%%", p1); + } else { + ULong p2; + UInt ex; + switch (d) { + case 1: ex = 10; break; + case 2: ex = 100; break; + case 3: ex = 1000; break; + default: assert(0); + /* was: VG_(tool_panic)("Currently can only handle 3 decimal places"); */ + } + p2 = ((100*n*ex) / m) % ex; + // Have to generate the format string in order to be flexible about + // the width of the post-decimal-point part. + sprintf(fmt, "%%lld.%%0%dlld%%%%", d); + // fmt is now "%lld.%0<d>lld%%" where <d> is 1,2,3... + sprintf(buf, fmt, p1, p2); + } + + len = strlen(buf); + space = n_buf - len; + if (space < 0) space = 0; /* Allow for v. small field_width */ + i = len; + + /* Right justify in field */ + for ( ; i >= 0; i--) buf[i + space] = buf[i]; + for (i = 0; i < space; i++) buf[i] = ' '; +} + + +/*------------------------------------------------------------*/ +/*--- Stats ---*/ +/*------------------------------------------------------------*/ + +/* This part excerpted from coregrind/m_translate.c */ + +static UInt n_SP_updates_fast = 0; +static UInt n_SP_updates_generic_known = 0; +static UInt n_SP_updates_generic_unknown = 0; + +void VG_print_translation_stats ( void ) +{ + Char buf[6]; + UInt n_SP_updates = n_SP_updates_fast + n_SP_updates_generic_known + + n_SP_updates_generic_unknown; + VG_percentify(n_SP_updates_fast, n_SP_updates, 1, 6, buf); + printf( + "translate: fast SP updates identified: %'u (%s)\n", + n_SP_updates_fast, buf ); + + VG_percentify(n_SP_updates_generic_known, n_SP_updates, 1, 6, buf); + printf( + "translate: generic_known SP updates identified: %'u (%s)\n", + n_SP_updates_generic_known, buf ); + + VG_percentify(n_SP_updates_generic_unknown, n_SP_updates, 1, 6, buf); + printf( + "translate: generic_unknown SP updates identified: %'u (%s)\n", + n_SP_updates_generic_unknown, buf ); +} + + + +int main ( void ) +{ + VG_print_translation_stats(); + return 0; +} diff --git a/exp-sgcheck/tests/bad_percentify.stderr.exp-glibc28-amd64 b/exp-sgcheck/tests/bad_percentify.stderr.exp-glibc28-amd64 new file mode 100644 index 00000000..b647e4a4 --- /dev/null +++ b/exp-sgcheck/tests/bad_percentify.stderr.exp-glibc28-amd64 @@ -0,0 +1,33 @@ + +Invalid read of size 1 + at 0x........: strlen (h_intercepts.c:...) + by 0x........: ... + by 0x........: ... + by 0x........: VG_print_translation_stats (bad_percentify.c:88) + by 0x........: main (bad_percentify.c:107) + Address 0x........ expected vs actual: + Expected: stack array "buf" in frame 3 back from here + Actual: unknown + +Invalid read of size 1 + at 0x........: strlen (h_intercepts.c:...) + by 0x........: ... + by 0x........: ... + by 0x........: VG_print_translation_stats (bad_percentify.c:93) + by 0x........: main (bad_percentify.c:107) + Address 0x........ expected vs actual: + Expected: stack array "buf" in frame 3 back from here + Actual: unknown + +Invalid read of size 1 + at 0x........: strlen (h_intercepts.c:...) + by 0x........: ... + by 0x........: ... + by 0x........: VG_print_translation_stats (bad_percentify.c:98) + by 0x........: main (bad_percentify.c:107) + Address 0x........ expected vs actual: + Expected: stack array "buf" in frame 3 back from here + Actual: unknown + + +ERROR SUMMARY: 3 errors from 3 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/bad_percentify.stdout.exp b/exp-sgcheck/tests/bad_percentify.stdout.exp new file mode 100644 index 00000000..fd99c2c1 --- /dev/null +++ b/exp-sgcheck/tests/bad_percentify.stdout.exp @@ -0,0 +1,3 @@ +translate: fast SP updates identified: 0 (--% ) +translate: generic_known SP updates identified: 0 (--% ) +translate: generic_unknown SP updates identified: 0 (--% ) diff --git a/exp-sgcheck/tests/bad_percentify.vgtest b/exp-sgcheck/tests/bad_percentify.vgtest new file mode 100644 index 00000000..1f390b02 --- /dev/null +++ b/exp-sgcheck/tests/bad_percentify.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: bad_percentify diff --git a/exp-sgcheck/tests/base.c b/exp-sgcheck/tests/base.c new file mode 100644 index 00000000..e24b57b1 --- /dev/null +++ b/exp-sgcheck/tests/base.c @@ -0,0 +1,25 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // Base ======================================================== + b(p, p); // ok + + b(up, u); // ok + + b(un, u); // undet + + b(n, n); // det + + b(nn, n); // det + + return 0; +} diff --git a/exp-sgcheck/tests/base.stderr.exp-glibc25-amd64 b/exp-sgcheck/tests/base.stderr.exp-glibc25-amd64 new file mode 100644 index 00000000..ebe053b1 --- /dev/null +++ b/exp-sgcheck/tests/base.stderr.exp-glibc25-amd64 @@ -0,0 +1,36 @@ + +about to do 14 [0] +about to do 14 [-1] +Invalid read of size 8 + at 0x........: main (base.c:14) + Address 0x........ is 8 bytes before the accessing pointer's + legitimate range, a block of size 80 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + +about to do 16 [0] +about to do 16 [-1] +about to do 18 [0] +about to do 18 [-1] +about to do 20 [0] +Invalid read of size 8 + at 0x........: main (base.c:20) + Address 0x........ is not derived from any known block + +about to do 20 [-1] +Invalid read of size 8 + at 0x........: main (base.c:20) + Address 0x........ is not derived from any known block + +about to do 22 [0] +Invalid read of size 8 + at 0x........: main (base.c:22) + Address 0x........ is not derived from any known block + +about to do 22 [-1] +Invalid read of size 8 + at 0x........: main (base.c:22) + Address 0x........ is not derived from any known block + + +ERROR SUMMARY: 5 errors from 5 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/base.stderr.exp-glibc25-x86 b/exp-sgcheck/tests/base.stderr.exp-glibc25-x86 new file mode 100644 index 00000000..a525dc99 --- /dev/null +++ b/exp-sgcheck/tests/base.stderr.exp-glibc25-x86 @@ -0,0 +1,36 @@ + +about to do 14 [0] +about to do 14 [-1] +Invalid read of size 4 + at 0x........: main (base.c:14) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + +about to do 16 [0] +about to do 16 [-1] +about to do 18 [0] +about to do 18 [-1] +about to do 20 [0] +Invalid read of size 4 + at 0x........: main (base.c:20) + Address 0x........ is not derived from any known block + +about to do 20 [-1] +Invalid read of size 4 + at 0x........: main (base.c:20) + Address 0x........ is not derived from any known block + +about to do 22 [0] +Invalid read of size 4 + at 0x........: main (base.c:22) + Address 0x........ is not derived from any known block + +about to do 22 [-1] +Invalid read of size 4 + at 0x........: main (base.c:22) + Address 0x........ is not derived from any known block + + +ERROR SUMMARY: 5 errors from 5 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/base.vgtest b/exp-sgcheck/tests/base.vgtest new file mode 100644 index 00000000..7aa99d00 --- /dev/null +++ b/exp-sgcheck/tests/base.vgtest @@ -0,0 +1,3 @@ +prereq: ./is_arch_supported +prog: base +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/ccc.cpp b/exp-sgcheck/tests/ccc.cpp new file mode 100644 index 00000000..abd3119a --- /dev/null +++ b/exp-sgcheck/tests/ccc.cpp @@ -0,0 +1,41 @@ +#define _XOPEN_SOURCE 600 // to enable posix_memalign() +#include <assert.h> +#include <stdlib.h> +#include <malloc.h> // for memalign() +static __attribute__((noinline)) void bar ( int ); /* fwds */ +int main(void) { + int sum = 0; + int* x1 = (int*)malloc(sizeof(int)); + int* x2 = new int; + int* x3 = new int[10]; + int* x4 = (int*)calloc(1, sizeof(int)); + int* x5 = (int*)memalign(8, sizeof(int)); + int* x6; void* v6; + int res = posix_memalign(&v6, 8, sizeof(int)); x6 = (int*)v6; + assert(NULL != x1 && NULL != x2 && NULL != x3 && NULL != x4 && + NULL != x5 && 0 == res); + + __asm__ __volatile__("":::"memory"); + // all underruns + sum += x1[-1]; __asm__ __volatile__("":::"memory"); bar(1); + sum += x2[-1]; __asm__ __volatile__("":::"memory"); bar(2); + sum += x3[-1]; __asm__ __volatile__("":::"memory"); bar(3); + sum += x4[-1]; __asm__ __volatile__("":::"memory"); bar(4); + sum += x5[-1]; __asm__ __volatile__("":::"memory"); bar(5); + sum += x6[-1]; __asm__ __volatile__("":::"memory"); bar(6); + __asm__ __volatile__("":::"memory"); + return sum; +} + +/* What's with all this __asm__ __volatile__ stuff? Well, it's an + attempt to get gcc-4.1.2 not to claim the memory references that + we're interested in -- x1[-1] through x6[-1] -- appear on different + lines than they really do. By its own rules, gcc can't move code + across an __asm__ __volatile__, and the "memory" item says each one + clobbers memory in some way which gcc can't know, so that probably + (!) persuades it not to carry memory CSEs around either. */ + +static __attribute__((noinline)) void bar ( int x ) +{ + __asm__ __volatile__("":::"memory"); +} diff --git a/exp-sgcheck/tests/ccc.stderr.exp-glibc25-amd64 b/exp-sgcheck/tests/ccc.stderr.exp-glibc25-amd64 new file mode 100644 index 00000000..37cbad37 --- /dev/null +++ b/exp-sgcheck/tests/ccc.stderr.exp-glibc25-amd64 @@ -0,0 +1,46 @@ + +Invalid read of size 4 + at 0x........: main (ccc.cpp:20) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:8) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:21) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: ...operator new... (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:9) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:22) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: ...operator new[]... (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:10) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:22) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: calloc (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:11) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:23) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: memalign (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:12) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:24) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: memalign (vg_replace_malloc.c:...) + by 0x........: posix_memalign (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:14) + + +ERROR SUMMARY: 6 errors from 6 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/ccc.stderr.exp-glibc27-x86 b/exp-sgcheck/tests/ccc.stderr.exp-glibc27-x86 new file mode 100644 index 00000000..cff83e99 --- /dev/null +++ b/exp-sgcheck/tests/ccc.stderr.exp-glibc27-x86 @@ -0,0 +1,46 @@ + +Invalid read of size 4 + at 0x........: main (ccc.cpp:20) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:8) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:21) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: ...operator new... (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:9) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:22) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: ...operator new[]... (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:10) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:23) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: calloc (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:11) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:24) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: memalign (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:12) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:25) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: memalign (vg_replace_malloc.c:...) + by 0x........: posix_memalign (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:14) + + +ERROR SUMMARY: 6 errors from 6 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/ccc.stderr.exp-glibc28-amd64 b/exp-sgcheck/tests/ccc.stderr.exp-glibc28-amd64 new file mode 100644 index 00000000..0e35bcbf --- /dev/null +++ b/exp-sgcheck/tests/ccc.stderr.exp-glibc28-amd64 @@ -0,0 +1,46 @@ + +Invalid read of size 4 + at 0x........: main (ccc.cpp:20) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:8) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:21) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: ...operator new... (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:9) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:22) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: ...operator new[]... (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:10) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:23) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: calloc (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:11) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:24) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: memalign (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:12) + +Invalid read of size 4 + at 0x........: main (ccc.cpp:22) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: memalign (vg_replace_malloc.c:...) + by 0x........: posix_memalign (vg_replace_malloc.c:...) + by 0x........: main (ccc.cpp:14) + + +ERROR SUMMARY: 6 errors from 6 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/ccc.vgtest b/exp-sgcheck/tests/ccc.vgtest new file mode 100644 index 00000000..d6d7ae16 --- /dev/null +++ b/exp-sgcheck/tests/ccc.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: ccc diff --git a/exp-sgcheck/tests/cmp.c b/exp-sgcheck/tests/cmp.c new file mode 100644 index 00000000..049295b8 --- /dev/null +++ b/exp-sgcheck/tests/cmp.c @@ -0,0 +1,27 @@ +#include <stdlib.h> + +// The comparisons use SUB instructions, and this can result in having a +// (nonptr - ptr) situation legitimately; at one point I was flagging +// errors when that happened. + +int main(void) +{ + char* buf = malloc(sizeof(char) * 6); + + // Known zero non-pointer + char* nz = (char*)((long)buf^(long)buf); // known non-pointer + + // Unknown zero nonptr; make them zero but unknown + char* unz; + ((char*)&unz)[0] = '\0'; + ((char*)&unz)[1] = '\0'; + ((char*)&unz)[2] = '\0'; + ((char*)&unz)[3] = '\0'; + + if (buf == nz) return 1; + if (nz == buf) return 1; // --> n - p, but legitimate + if (buf == unz) return 1; + if (unz == buf) return 1; + + return 0; +} diff --git a/exp-sgcheck/tests/cmp.stderr.exp b/exp-sgcheck/tests/cmp.stderr.exp new file mode 100644 index 00000000..d18786f8 --- /dev/null +++ b/exp-sgcheck/tests/cmp.stderr.exp @@ -0,0 +1,3 @@ + + +ERROR SUMMARY: 0 errors from 0 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/cmp.vgtest-disabled b/exp-sgcheck/tests/cmp.vgtest-disabled new file mode 100644 index 00000000..9b73f143 --- /dev/null +++ b/exp-sgcheck/tests/cmp.vgtest-disabled @@ -0,0 +1 @@ +prog: cmp diff --git a/exp-sgcheck/tests/filter_add b/exp-sgcheck/tests/filter_add new file mode 100755 index 00000000..ad8fbbc9 --- /dev/null +++ b/exp-sgcheck/tests/filter_add @@ -0,0 +1,8 @@ +#! /bin/sh + +dir=`dirname $0` + +$dir/filter_stderr | + +# Anonymise "before" distances (if greater than 9 bytes) +sed "s/Address 0x........ is [0-9][0-9]\+ bytes /Address 0x........ is ... bytes /" diff --git a/exp-sgcheck/tests/filter_stderr b/exp-sgcheck/tests/filter_stderr new file mode 100755 index 00000000..f315d9e1 --- /dev/null +++ b/exp-sgcheck/tests/filter_stderr @@ -0,0 +1,38 @@ +#! /bin/sh + +dir=`dirname $0` + +$dir/../../tests/filter_stderr_basic | + +# Anonymise addresses +$dir/../../tests/filter_addresses | + +# Anonymise paths like "(in /foo/bar/libc-baz.so)" +sed "s/(in \/.*libc.*)$/(in \/...libc...)/" | +sed "s/(in \/.*libpthread.*)$/(in \/...libpthread...)/" | + +# Anonymise paths like "__libc_start_main (../foo/bar/libc-quux.c:129)" +sed "s/__libc_\(.*\) (.*)$/__libc_\1 (...libc...)/" | + +# Remove preambly stuff; also postambly stuff +sed \ +-e "/^exp-ptrcheck, a heap, stack and global array overrun detector$/d" \ +-e "/^NOTE: This is an Experimental-Class Valgrind Tool$/d" \ +-e "/^Copyright (C) 2003-201., and GNU GPL'd, by OpenWorks Ltd et al.$/d" \ +-e "/^For counts of detected and suppressed errors, rerun with: -v$/d" | + +# Tidy up in cases where glibc (+ libdl + libpthread + ld) have +# been built with debugging information, hence source locs are present. +sed \ +-e "s/ vfprintf (.*)/ .../" \ +-e "s/ vsprintf (.*)/ .../" \ +-e "s/ sprintf (.*)/ .../" \ +-e "s/ printf (.*)/ .../" \ +-e "s/ strdup (.*)/ .../" \ +-e "s/(pthread_key_create.c:[0-9]*)/(in \/...libpthread...)/" \ +-e "s/(genops.c:[0-9]*)/(in \/...libc...)/" \ +-e "s/(syscall-template.S:[0-9]*)/(in \/...libc...)/" | + +# Anonymise line numbers in h_intercepts.c. +sed "s/h_intercepts.c:[0-9]*/h_intercepts.c:.../" + diff --git a/exp-sgcheck/tests/filter_suppgen b/exp-sgcheck/tests/filter_suppgen new file mode 100755 index 00000000..6a95de53 --- /dev/null +++ b/exp-sgcheck/tests/filter_suppgen @@ -0,0 +1,11 @@ + +#! /bin/sh + +dir=`dirname $0` + +$dir/filter_stderr | + +# Anonymise "obj:" path +sed "s/obj:.*\/annelid\/tests\/supp/obj:*\/annelid\/tests\/supp/" + + diff --git a/exp-sgcheck/tests/fp.c b/exp-sgcheck/tests/fp.c new file mode 100644 index 00000000..8bcf1ad6 --- /dev/null +++ b/exp-sgcheck/tests/fp.c @@ -0,0 +1,17 @@ + +#include <stdlib.h> + +int main ( void ) +{ + double* dp = malloc(sizeof(double)); + float* fp = malloc(sizeof(float)); + + *dp += 3.0; // ok + *fp += 30.0; // ok + free(dp); + free(fp); + *dp += 3.0; // bad, been freed + *fp += 30.0; // bad, been freed + + return 0; +} diff --git a/exp-sgcheck/tests/fp.stderr.exp b/exp-sgcheck/tests/fp.stderr.exp new file mode 100644 index 00000000..11e99884 --- /dev/null +++ b/exp-sgcheck/tests/fp.stderr.exp @@ -0,0 +1,31 @@ + +Invalid read of size 8 + at 0x........: main (fp.c:13) + Address 0x........ is 0 bytes inside the accessing pointer's + once-legitimate range, a block of size 8 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (fp.c:11) + +Invalid write of size 8 + at 0x........: main (fp.c:13) + Address 0x........ is 0 bytes inside the accessing pointer's + once-legitimate range, a block of size 8 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (fp.c:11) + +Invalid read of size 4 + at 0x........: main (fp.c:14) + Address 0x........ is 0 bytes inside the accessing pointer's + once-legitimate range, a block of size 4 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (fp.c:12) + +Invalid write of size 4 + at 0x........: main (fp.c:14) + Address 0x........ is 0 bytes inside the accessing pointer's + once-legitimate range, a block of size 4 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (fp.c:12) + + +ERROR SUMMARY: 4 errors from 4 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/fp.vgtest b/exp-sgcheck/tests/fp.vgtest new file mode 100644 index 00000000..bd93cf80 --- /dev/null +++ b/exp-sgcheck/tests/fp.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: fp diff --git a/exp-sgcheck/tests/globalerr.c b/exp-sgcheck/tests/globalerr.c new file mode 100644 index 00000000..5b42763e --- /dev/null +++ b/exp-sgcheck/tests/globalerr.c @@ -0,0 +1,15 @@ + +#include <stdio.h> + +short a[7]; +static short b[7]; + +int main ( void ) +{ + int i; + short sum; + for (i = 0; i < 7+1; i++) { + sum += a[i] * b[i]; + } + return 1 & ((unsigned int)sum / 1000000); +} diff --git a/exp-sgcheck/tests/globalerr.stderr.exp-glibc28-amd64 b/exp-sgcheck/tests/globalerr.stderr.exp-glibc28-amd64 new file mode 100644 index 00000000..b80c8ca4 --- /dev/null +++ b/exp-sgcheck/tests/globalerr.stderr.exp-glibc28-amd64 @@ -0,0 +1,15 @@ + +Invalid read of size 2 + at 0x........: main (globalerr.c:12) + Address 0x........ expected vs actual: + Expected: global array "a" in object with soname "NONE" + Actual: unknown + +Invalid read of size 2 + at 0x........: main (globalerr.c:12) + Address 0x........ expected vs actual: + Expected: global array "b" in object with soname "NONE" + Actual: unknown + + +ERROR SUMMARY: 2 errors from 2 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/globalerr.stdout.exp b/exp-sgcheck/tests/globalerr.stdout.exp new file mode 100644 index 00000000..e69de29b --- /dev/null +++ b/exp-sgcheck/tests/globalerr.stdout.exp diff --git a/exp-sgcheck/tests/globalerr.vgtest b/exp-sgcheck/tests/globalerr.vgtest new file mode 100644 index 00000000..c6749cb4 --- /dev/null +++ b/exp-sgcheck/tests/globalerr.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: globalerr diff --git a/exp-sgcheck/tests/hackedbz2.c b/exp-sgcheck/tests/hackedbz2.c new file mode 100644 index 00000000..0d3d8d46 --- /dev/null +++ b/exp-sgcheck/tests/hackedbz2.c @@ -0,0 +1,6537 @@ + +/* This is a very slightly modified version of perf/bz2.c, with a + single change that causes it to overrun a global array by one byte. + The change in question is a change of the size of myprintf_buf from + 1000 to 70, at line 1278. ptrcheck should report exactly one + error, resulting from an out of range access to this array. */ + +// This benchmark is basically bzip2 (mashed to be a single file) +// compressing and decompressing some data. It tests Valgrind's handling of +// realistic and "difficult" (ie. lots of branches and memory accesses) +// integer code. Execution is spread out over quite a few basic blocks; +// --profile-flags indicates that to get to the top 90%th percentile of +// dynamic BB counts requires considering the top 51 basic blocks + +// This program can be used both as part of the performance test +// suite, in which case we want it to run for quite a while, +// and as part of the regression (correctness) test suite, in +// which case we want it to run quickly and be verbose. +// So it does the latter iff given a command line arg. + +// Licensing: the code within is mostly taken from bzip2, which has a BSD +// license. There is a little code from VEX, which is licensed under GPLv2 +// And it's all written by Julian Seward. + +#define BZ_NO_STDIO + + +/*-------------------------------------------------------------*/ +/*--- Private header file for the library. ---*/ +/*--- bzlib_private.h ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + + +#ifndef _BZLIB_PRIVATE_H +#define _BZLIB_PRIVATE_H + +#include <stdlib.h> + +#ifndef BZ_NO_STDIO +#include <stdio.h> +#include <ctype.h> +#include <string.h> +#endif + + +/*-------------------------------------------------------------*/ +/*--- Public header file for the library. ---*/ +/*--- bzlib.h ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + + +#ifndef _BZLIB_H +#define _BZLIB_H + +#ifdef __cplusplus +extern "C" { +#endif + +#define BZ_RUN 0 +#define BZ_FLUSH 1 +#define BZ_FINISH 2 + +#define BZ_OK 0 +#define BZ_RUN_OK 1 +#define BZ_FLUSH_OK 2 +#define BZ_FINISH_OK 3 +#define BZ_STREAM_END 4 +#define BZ_SEQUENCE_ERROR (-1) +#define BZ_PARAM_ERROR (-2) +#define BZ_MEM_ERROR (-3) +#define BZ_DATA_ERROR (-4) +#define BZ_DATA_ERROR_MAGIC (-5) +#define BZ_IO_ERROR (-6) +#define BZ_UNEXPECTED_EOF (-7) +#define BZ_OUTBUFF_FULL (-8) +#define BZ_CONFIG_ERROR (-9) + +typedef + struct { + char *next_in; + unsigned int avail_in; + unsigned int total_in_lo32; + unsigned int total_in_hi32; + + char *next_out; + unsigned int avail_out; + unsigned int total_out_lo32; + unsigned int total_out_hi32; + + void *state; + + void *(*bzalloc)(void *,int,int); + void (*bzfree)(void *,void *); + void *opaque; + } + bz_stream; + + +#ifndef BZ_IMPORT +#define BZ_EXPORT +#endif + +#ifndef BZ_NO_STDIO +/* Need a definitition for FILE */ +#include <stdio.h> +#endif + +#ifdef _WIN32 +# include <windows.h> +# ifdef small + /* windows.h define small to char */ +# undef small +# endif +# ifdef BZ_EXPORT +# define BZ_API(func) WINAPI func +# define BZ_EXTERN extern +# else + /* import windows dll dynamically */ +# define BZ_API(func) (WINAPI * func) +# define BZ_EXTERN +# endif +#else +# define BZ_API(func) func +# define BZ_EXTERN extern +#endif + + +/*-- Core (low-level) library functions --*/ + +BZ_EXTERN int BZ_API(BZ2_bzCompressInit) ( + bz_stream* strm, + int blockSize100k, + int verbosity, + int workFactor + ); + +BZ_EXTERN int BZ_API(BZ2_bzCompress) ( + bz_stream* strm, + int action + ); + +BZ_EXTERN int BZ_API(BZ2_bzCompressEnd) ( + bz_stream* strm + ); + +BZ_EXTERN int BZ_API(BZ2_bzDecompressInit) ( + bz_stream *strm, + int verbosity, + int small + ); + +BZ_EXTERN int BZ_API(BZ2_bzDecompress) ( + bz_stream* strm + ); + +BZ_EXTERN int BZ_API(BZ2_bzDecompressEnd) ( + bz_stream *strm + ); + + + +/*-- High(er) level library functions --*/ + +#ifndef BZ_NO_STDIO +#define BZ_MAX_UNUSED 5000 + +typedef void BZFILE; + +BZ_EXTERN BZFILE* BZ_API(BZ2_bzReadOpen) ( + int* bzerror, + FILE* f, + int verbosity, + int small, + void* unused, + int nUnused + ); + +BZ_EXTERN void BZ_API(BZ2_bzReadClose) ( + int* bzerror, + BZFILE* b + ); + +BZ_EXTERN void BZ_API(BZ2_bzReadGetUnused) ( + int* bzerror, + BZFILE* b, + void** unused, + int* nUnused + ); + +BZ_EXTERN int BZ_API(BZ2_bzRead) ( + int* bzerror, + BZFILE* b, + void* buf, + int len + ); + +BZ_EXTERN BZFILE* BZ_API(BZ2_bzWriteOpen) ( + int* bzerror, + FILE* f, + int blockSize100k, + int verbosity, + int workFactor + ); + +BZ_EXTERN void BZ_API(BZ2_bzWrite) ( + int* bzerror, + BZFILE* b, + void* buf, + int len + ); + +BZ_EXTERN void BZ_API(BZ2_bzWriteClose) ( + int* bzerror, + BZFILE* b, + int abandon, + unsigned int* nbytes_in, + unsigned int* nbytes_out + ); + +BZ_EXTERN void BZ_API(BZ2_bzWriteClose64) ( + int* bzerror, + BZFILE* b, + int abandon, + unsigned int* nbytes_in_lo32, + unsigned int* nbytes_in_hi32, + unsigned int* nbytes_out_lo32, + unsigned int* nbytes_out_hi32 + ); +#endif + + +/*-- Utility functions --*/ + +BZ_EXTERN int BZ_API(BZ2_bzBuffToBuffCompress) ( + char* dest, + unsigned int* destLen, + char* source, + unsigned int sourceLen, + int blockSize100k, + int verbosity, + int workFactor + ); + +BZ_EXTERN int BZ_API(BZ2_bzBuffToBuffDecompress) ( + char* dest, + unsigned int* destLen, + char* source, + unsigned int sourceLen, + int small, + int verbosity + ); + + +/*-- + Code contributed by Yoshioka Tsuneo + (QWF00133@niftyserve.or.jp/tsuneo-y@is.aist-nara.ac.jp), + to support better zlib compatibility. + This code is not _officially_ part of libbzip2 (yet); + I haven't tested it, documented it, or considered the + threading-safeness of it. + If this code breaks, please contact both Yoshioka and me. +--*/ + +BZ_EXTERN const char * BZ_API(BZ2_bzlibVersion) ( + void + ); + +#ifndef BZ_NO_STDIO +BZ_EXTERN BZFILE * BZ_API(BZ2_bzopen) ( + const char *path, + const char *mode + ); + +BZ_EXTERN BZFILE * BZ_API(BZ2_bzdopen) ( + int fd, + const char *mode + ); + +BZ_EXTERN int BZ_API(BZ2_bzread) ( + BZFILE* b, + void* buf, + int len + ); + +BZ_EXTERN int BZ_API(BZ2_bzwrite) ( + BZFILE* b, + void* buf, + int len + ); + +BZ_EXTERN int BZ_API(BZ2_bzflush) ( + BZFILE* b + ); + +BZ_EXTERN void BZ_API(BZ2_bzclose) ( + BZFILE* b + ); + +BZ_EXTERN const char * BZ_API(BZ2_bzerror) ( + BZFILE *b, + int *errnum + ); +#endif + +#ifdef __cplusplus +} +#endif + +#endif + +/*-------------------------------------------------------------*/ +/*--- end bzlib.h ---*/ +/*-------------------------------------------------------------*/ + + + + +/*-- General stuff. --*/ + +#define BZ_VERSION "1.0.3, 17-Oct-2004" + +typedef char Char; +typedef unsigned char Bool; +typedef unsigned char UChar; +typedef int Int32; +typedef unsigned int UInt32; +typedef short Int16; +typedef unsigned short UInt16; + +#define True ((Bool)1) +#define False ((Bool)0) + +#ifndef __GNUC__ +#define __inline__ /* */ +#endif + +#ifndef BZ_NO_STDIO +extern void BZ2_bz__AssertH__fail ( int errcode ); +#define AssertH(cond,errcode) \ + { if (!(cond)) BZ2_bz__AssertH__fail ( errcode ); } +#if BZ_DEBUG +#define AssertD(cond,msg) \ + { if (!(cond)) { \ + fprintf ( stderr, \ + "\n\nlibbzip2(debug build): internal error\n\t%s\n", msg );\ + exit(1); \ + }} +#else +#define AssertD(cond,msg) /* */ +#endif +#define VPrintf0(zf) \ + fprintf(stderr,zf) +#define VPrintf1(zf,za1) \ + fprintf(stderr,zf,za1) +#define VPrintf2(zf,za1,za2) \ + fprintf(stderr,zf,za1,za2) +#define VPrintf3(zf,za1,za2,za3) \ + fprintf(stderr,zf,za1,za2,za3) +#define VPrintf4(zf,za1,za2,za3,za4) \ + fprintf(stderr,zf,za1,za2,za3,za4) +#define VPrintf5(zf,za1,za2,za3,za4,za5) \ + fprintf(stderr,zf,za1,za2,za3,za4,za5) +#else +extern void bz_internal_error ( int errcode ); +#define AssertH(cond,errcode) \ + { if (!(cond)) bz_internal_error ( errcode ); } +#define AssertD(cond,msg) /* */ +#define VPrintf0(zf) \ + vex_printf(zf) +#define VPrintf1(zf,za1) \ + vex_printf(zf,za1) +#define VPrintf2(zf,za1,za2) \ + vex_printf(zf,za1,za2) +#define VPrintf3(zf,za1,za2,za3) \ + vex_printf(zf,za1,za2,za3) +#define VPrintf4(zf,za1,za2,za3,za4) \ + vex_printf(zf,za1,za2,za3,za4) +#define VPrintf5(zf,za1,za2,za3,za4,za5) \ + vex_printf(zf,za1,za2,za3,za4,za5) +#endif + + +#define BZALLOC(nnn) (strm->bzalloc)(strm->opaque,(nnn),1) +#define BZFREE(ppp) (strm->bzfree)(strm->opaque,(ppp)) + + +/*-- Header bytes. --*/ + +#define BZ_HDR_B 0x42 /* 'B' */ +#define BZ_HDR_Z 0x5a /* 'Z' */ +#define BZ_HDR_h 0x68 /* 'h' */ +#define BZ_HDR_0 0x30 /* '0' */ + +/*-- Constants for the back end. --*/ + +#define BZ_MAX_ALPHA_SIZE 258 +#define BZ_MAX_CODE_LEN 23 + +#define BZ_RUNA 0 +#define BZ_RUNB 1 + +#define BZ_N_GROUPS 6 +#define BZ_G_SIZE 50 +#define BZ_N_ITERS 4 + +#define BZ_MAX_SELECTORS (2 + (900000 / BZ_G_SIZE)) + + + +/*-- Stuff for randomising repetitive blocks. --*/ + +extern Int32 BZ2_rNums[512]; + +#define BZ_RAND_DECLS \ + Int32 rNToGo; \ + Int32 rTPos \ + +#define BZ_RAND_INIT_MASK \ + s->rNToGo = 0; \ + s->rTPos = 0 \ + +#define BZ_RAND_MASK ((s->rNToGo == 1) ? 1 : 0) + +#define BZ_RAND_UPD_MASK \ + if (s->rNToGo == 0) { \ + s->rNToGo = BZ2_rNums[s->rTPos]; \ + s->rTPos++; \ + if (s->rTPos == 512) s->rTPos = 0; \ + } \ + s->rNToGo--; + + + +/*-- Stuff for doing CRCs. --*/ + +extern UInt32 BZ2_crc32Table[256]; + +#define BZ_INITIALISE_CRC(crcVar) \ +{ \ + crcVar = 0xffffffffL; \ +} + +#define BZ_FINALISE_CRC(crcVar) \ +{ \ + crcVar = ~(crcVar); \ +} + +#define BZ_UPDATE_CRC(crcVar,cha) \ +{ \ + crcVar = (crcVar << 8) ^ \ + BZ2_crc32Table[(crcVar >> 24) ^ \ + ((UChar)cha)]; \ +} + + + +/*-- States and modes for compression. --*/ + +#define BZ_M_IDLE 1 +#define BZ_M_RUNNING 2 +#define BZ_M_FLUSHING 3 +#define BZ_M_FINISHING 4 + +#define BZ_S_OUTPUT 1 +#define BZ_S_INPUT 2 + +#define BZ_N_RADIX 2 +#define BZ_N_QSORT 12 +#define BZ_N_SHELL 18 +#define BZ_N_OVERSHOOT (BZ_N_RADIX + BZ_N_QSORT + BZ_N_SHELL + 2) + + + + +/*-- Structure holding all the compression-side stuff. --*/ + +typedef + struct { + /* pointer back to the struct bz_stream */ + bz_stream* strm; + + /* mode this stream is in, and whether inputting */ + /* or outputting data */ + Int32 mode; + Int32 state; + + /* remembers avail_in when flush/finish requested */ + UInt32 avail_in_expect; + + /* for doing the block sorting */ + UInt32* arr1; + UInt32* arr2; + UInt32* ftab; + Int32 origPtr; + + /* aliases for arr1 and arr2 */ + UInt32* ptr; + UChar* block; + UInt16* mtfv; + UChar* zbits; + + /* for deciding when to use the fallback sorting algorithm */ + Int32 workFactor; + + /* run-length-encoding of the input */ + UInt32 state_in_ch; + Int32 state_in_len; + BZ_RAND_DECLS; + + /* input and output limits and current posns */ + Int32 nblock; + Int32 nblockMAX; + Int32 numZ; + Int32 state_out_pos; + + /* map of bytes used in block */ + Int32 nInUse; + Bool inUse[256]; + UChar unseqToSeq[256]; + + /* the buffer for bit stream creation */ + UInt32 bsBuff; + Int32 bsLive; + + /* block and combined CRCs */ + UInt32 blockCRC; + UInt32 combinedCRC; + + /* misc administratium */ + Int32 verbosity; + Int32 blockNo; + Int32 blockSize100k; + + /* stuff for coding the MTF values */ + Int32 nMTF; + Int32 mtfFreq [BZ_MAX_ALPHA_SIZE]; + UChar selector [BZ_MAX_SELECTORS]; + UChar selectorMtf[BZ_MAX_SELECTORS]; + + UChar len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + Int32 code [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + Int32 rfreq [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + /* second dimension: only 3 needed; 4 makes index calculations faster */ + UInt32 len_pack[BZ_MAX_ALPHA_SIZE][4]; + + } + EState; + + + +/*-- externs for compression. --*/ + +extern void +BZ2_blockSort ( EState* ); + +extern void +BZ2_compressBlock ( EState*, Bool ); + +extern void +BZ2_bsInitWrite ( EState* ); + +extern void +BZ2_hbAssignCodes ( Int32*, UChar*, Int32, Int32, Int32 ); + +extern void +BZ2_hbMakeCodeLengths ( UChar*, Int32*, Int32, Int32 ); + + + +/*-- states for decompression. --*/ + +#define BZ_X_IDLE 1 +#define BZ_X_OUTPUT 2 + +#define BZ_X_MAGIC_1 10 +#define BZ_X_MAGIC_2 11 +#define BZ_X_MAGIC_3 12 +#define BZ_X_MAGIC_4 13 +#define BZ_X_BLKHDR_1 14 +#define BZ_X_BLKHDR_2 15 +#define BZ_X_BLKHDR_3 16 +#define BZ_X_BLKHDR_4 17 +#define BZ_X_BLKHDR_5 18 +#define BZ_X_BLKHDR_6 19 +#define BZ_X_BCRC_1 20 +#define BZ_X_BCRC_2 21 +#define BZ_X_BCRC_3 22 +#define BZ_X_BCRC_4 23 +#define BZ_X_RANDBIT 24 +#define BZ_X_ORIGPTR_1 25 +#define BZ_X_ORIGPTR_2 26 +#define BZ_X_ORIGPTR_3 27 +#define BZ_X_MAPPING_1 28 +#define BZ_X_MAPPING_2 29 +#define BZ_X_SELECTOR_1 30 +#define BZ_X_SELECTOR_2 31 +#define BZ_X_SELECTOR_3 32 +#define BZ_X_CODING_1 33 +#define BZ_X_CODING_2 34 +#define BZ_X_CODING_3 35 +#define BZ_X_MTF_1 36 +#define BZ_X_MTF_2 37 +#define BZ_X_MTF_3 38 +#define BZ_X_MTF_4 39 +#define BZ_X_MTF_5 40 +#define BZ_X_MTF_6 41 +#define BZ_X_ENDHDR_2 42 +#define BZ_X_ENDHDR_3 43 +#define BZ_X_ENDHDR_4 44 +#define BZ_X_ENDHDR_5 45 +#define BZ_X_ENDHDR_6 46 +#define BZ_X_CCRC_1 47 +#define BZ_X_CCRC_2 48 +#define BZ_X_CCRC_3 49 +#define BZ_X_CCRC_4 50 + + + +/*-- Constants for the fast MTF decoder. --*/ + +#define MTFA_SIZE 4096 +#define MTFL_SIZE 16 + + + +/*-- Structure holding all the decompression-side stuff. --*/ + +typedef + struct { + /* pointer back to the struct bz_stream */ + bz_stream* strm; + + /* state indicator for this stream */ + Int32 state; + + /* for doing the final run-length decoding */ + UChar state_out_ch; + Int32 state_out_len; + Bool blockRandomised; + BZ_RAND_DECLS; + + /* the buffer for bit stream reading */ + UInt32 bsBuff; + Int32 bsLive; + + /* misc administratium */ + Int32 blockSize100k; + Bool smallDecompress; + Int32 currBlockNo; + Int32 verbosity; + + /* for undoing the Burrows-Wheeler transform */ + Int32 origPtr; + UInt32 tPos; + Int32 k0; + Int32 unzftab[256]; + Int32 nblock_used; + Int32 cftab[257]; + Int32 cftabCopy[257]; + + /* for undoing the Burrows-Wheeler transform (FAST) */ + UInt32 *tt; + + /* for undoing the Burrows-Wheeler transform (SMALL) */ + UInt16 *ll16; + UChar *ll4; + + /* stored and calculated CRCs */ + UInt32 storedBlockCRC; + UInt32 storedCombinedCRC; + UInt32 calculatedBlockCRC; + UInt32 calculatedCombinedCRC; + + /* map of bytes used in block */ + Int32 nInUse; + Bool inUse[256]; + Bool inUse16[16]; + UChar seqToUnseq[256]; + + /* for decoding the MTF values */ + UChar mtfa [MTFA_SIZE]; + Int32 mtfbase[256 / MTFL_SIZE]; + UChar selector [BZ_MAX_SELECTORS]; + UChar selectorMtf[BZ_MAX_SELECTORS]; + UChar len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + + Int32 limit [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + Int32 base [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + Int32 perm [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + Int32 minLens[BZ_N_GROUPS]; + + /* save area for scalars in the main decompress code */ + Int32 save_i; + Int32 save_j; + Int32 save_t; + Int32 save_alphaSize; + Int32 save_nGroups; + Int32 save_nSelectors; + Int32 save_EOB; + Int32 save_groupNo; + Int32 save_groupPos; + Int32 save_nextSym; + Int32 save_nblockMAX; + Int32 save_nblock; + Int32 save_es; + Int32 save_N; + Int32 save_curr; + Int32 save_zt; + Int32 save_zn; + Int32 save_zvec; + Int32 save_zj; + Int32 save_gSel; + Int32 save_gMinlen; + Int32* save_gLimit; + Int32* save_gBase; + Int32* save_gPerm; + + } + DState; + + + +/*-- Macros for decompression. --*/ + +#define BZ_GET_FAST(cccc) \ + s->tPos = s->tt[s->tPos]; \ + cccc = (UChar)(s->tPos & 0xff); \ + s->tPos >>= 8; + +#define BZ_GET_FAST_C(cccc) \ + c_tPos = c_tt[c_tPos]; \ + cccc = (UChar)(c_tPos & 0xff); \ + c_tPos >>= 8; + +#define SET_LL4(i,n) \ + { if (((i) & 0x1) == 0) \ + s->ll4[(i) >> 1] = (s->ll4[(i) >> 1] & 0xf0) | (n); else \ + s->ll4[(i) >> 1] = (s->ll4[(i) >> 1] & 0x0f) | ((n) << 4); \ + } + +#define GET_LL4(i) \ + ((((UInt32)(s->ll4[(i) >> 1])) >> (((i) << 2) & 0x4)) & 0xF) + +#define SET_LL(i,n) \ + { s->ll16[i] = (UInt16)(n & 0x0000ffff); \ + SET_LL4(i, n >> 16); \ + } + +#define GET_LL(i) \ + (((UInt32)s->ll16[i]) | (GET_LL4(i) << 16)) + +#define BZ_GET_SMALL(cccc) \ + cccc = BZ2_indexIntoF ( s->tPos, s->cftab ); \ + s->tPos = GET_LL(s->tPos); + + +/*-- externs for decompression. --*/ + +extern Int32 +BZ2_indexIntoF ( Int32, Int32* ); + +extern Int32 +BZ2_decompress ( DState* ); + +extern void +BZ2_hbCreateDecodeTables ( Int32*, Int32*, Int32*, UChar*, + Int32, Int32, Int32 ); + + +#endif + + +/*-- BZ_NO_STDIO seems to make NULL disappear on some platforms. --*/ + +#ifdef BZ_NO_STDIO +#ifndef NULL +#define NULL 0 +#endif +#endif + + +/*-------------------------------------------------------------*/ +/*--- end bzlib_private.h ---*/ +/*-------------------------------------------------------------*/ + + +/* Something which has the same size as void* on the host. That is, + it is 32 bits on a 32-bit host and 64 bits on a 64-bit host, and so + it can safely be coerced to and from a pointer type on the host + machine. */ +typedef unsigned long HWord; +typedef char HChar; +typedef signed int Int; +typedef unsigned int UInt; + +typedef signed long long int Long; +typedef unsigned long long int ULong; + + +///////////////////////////////////////////////////////////////////// +///////////////////////////////////////////////////////////////////// + +static HWord (*serviceFn)(HWord,HWord) = 0; + +#if 0 +static char* my_strcpy ( char* dest, const char* src ) +{ + char* dest_orig = dest; + while (*src) *dest++ = *src++; + *dest = 0; + return dest_orig; +} + +static void* my_memcpy ( void *dest, const void *src, int sz ) +{ + const char *s = (const char *)src; + char *d = (char *)dest; + + while (sz--) + *d++ = *s++; + + return dest; +} + +static void* my_memmove( void *dst, const void *src, unsigned int len ) +{ + register char *d; + register char *s; + if ( dst > src ) { + d = (char *)dst + len - 1; + s = (char *)src + len - 1; + while ( len >= 4 ) { + *d-- = *s--; + *d-- = *s--; + *d-- = *s--; + *d-- = *s--; + len -= 4; + } + while ( len-- ) { + *d-- = *s--; + } + } else if ( dst < src ) { + d = (char *)dst; + s = (char *)src; + while ( len >= 4 ) { + *d++ = *s++; + *d++ = *s++; + *d++ = *s++; + *d++ = *s++; + len -= 4; + } + while ( len-- ) { + *d++ = *s++; + } + } + return dst; +} +#endif + +char* my_strcat ( char* dest, const char* src ) +{ + char* dest_orig = dest; + while (*dest) dest++; + while (*src) *dest++ = *src++; + *dest = 0; + return dest_orig; +} + + +///////////////////////////////////////////////////////////////////// + +static void vex_log_bytes ( char* p, int n ) +{ + int i; + for (i = 0; i < n; i++) + (*serviceFn)( 1, (int)p[i] ); +} + +/*---------------------------------------------------------*/ +/*--- vex_printf ---*/ +/*---------------------------------------------------------*/ + +/* This should be the only <...> include in the entire VEX library. + New code for vex_util.c should go above this point. */ +#include <stdarg.h> + +static HChar vex_toupper ( HChar c ) +{ + if (c >= 'a' && c <= 'z') + return c + ('A' - 'a'); + else + return c; +} + +static Int vex_strlen ( const HChar* str ) +{ + Int i = 0; + while (str[i] != 0) i++; + return i; +} + +Bool vex_streq ( const HChar* s1, const HChar* s2 ) +{ + while (True) { + if (*s1 == 0 && *s2 == 0) + return True; + if (*s1 != *s2) + return False; + s1++; + s2++; + } +} + +/* Some flags. */ +#define VG_MSG_SIGNED 1 /* The value is signed. */ +#define VG_MSG_ZJUSTIFY 2 /* Must justify with '0'. */ +#define VG_MSG_LJUSTIFY 4 /* Must justify on the left. */ +#define VG_MSG_PAREN 8 /* Parenthesize if present (for %y) */ +#define VG_MSG_COMMA 16 /* Add commas to numbers (for %d, %u) */ + +/* Copy a string into the buffer. */ +static UInt +myvprintf_str ( void(*send)(HChar), Int flags, Int width, HChar* str, + Bool capitalise ) +{ +# define MAYBE_TOUPPER(ch) (capitalise ? vex_toupper(ch) : (ch)) + UInt ret = 0; + Int i, extra; + Int len = vex_strlen(str); + + if (width == 0) { + ret += len; + for (i = 0; i < len; i++) + send(MAYBE_TOUPPER(str[i])); + return ret; + } + + if (len > width) { + ret += width; + for (i = 0; i < width; i++) + send(MAYBE_TOUPPER(str[i])); + return ret; + } + + extra = width - len; + if (flags & VG_MSG_LJUSTIFY) { + ret += extra; + for (i = 0; i < extra; i++) + send(' '); + } + ret += len; + for (i = 0; i < len; i++) + send(MAYBE_TOUPPER(str[i])); + if (!(flags & VG_MSG_LJUSTIFY)) { + ret += extra; + for (i = 0; i < extra; i++) + send(' '); + } + +# undef MAYBE_TOUPPER + + return ret; +} + +/* Write P into the buffer according to these args: + * If SIGN is true, p is a signed. + * BASE is the base. + * If WITH_ZERO is true, '0' must be added. + * WIDTH is the width of the field. + */ +static UInt +myvprintf_int64 ( void(*send)(HChar), Int flags, Int base, Int width, ULong pL) +{ + HChar buf[40]; + Int ind = 0; + Int i, nc = 0; + Bool neg = False; + HChar *digits = "0123456789ABCDEF"; + UInt ret = 0; + UInt p = (UInt)pL; + + if (base < 2 || base > 16) + return ret; + + if ((flags & VG_MSG_SIGNED) && (Int)p < 0) { + p = - (Int)p; + neg = True; + } + + if (p == 0) + buf[ind++] = '0'; + else { + while (p > 0) { + if ((flags & VG_MSG_COMMA) && 10 == base && + 0 == (ind-nc) % 3 && 0 != ind) + { + buf[ind++] = ','; + nc++; + } + buf[ind++] = digits[p % base]; + p /= base; + } + } + + if (neg) + buf[ind++] = '-'; + + if (width > 0 && !(flags & VG_MSG_LJUSTIFY)) { + for(; ind < width; ind++) { + //vassert(ind < 39); + buf[ind] = ((flags & VG_MSG_ZJUSTIFY) ? '0': ' '); + } + } + + /* Reverse copy to buffer. */ + ret += ind; + for (i = ind -1; i >= 0; i--) { + send(buf[i]); + } + if (width > 0 && (flags & VG_MSG_LJUSTIFY)) { + for(; ind < width; ind++) { + ret++; + send(' '); // Never pad with zeroes on RHS -- changes the value! + } + } + return ret; +} + + +/* A simple vprintf(). */ +static +UInt vprintf_wrk ( void(*send)(HChar), const HChar *format, va_list vargs ) +{ + UInt ret = 0; + int i; + int flags; + int width; + Bool is_long; + + /* We assume that vargs has already been initialised by the + caller, using va_start, and that the caller will similarly + clean up with va_end. + */ + + for (i = 0; format[i] != 0; i++) { + if (format[i] != '%') { + send(format[i]); + ret++; + continue; + } + i++; + /* A '%' has been found. Ignore a trailing %. */ + if (format[i] == 0) + break; + if (format[i] == '%') { + /* `%%' is replaced by `%'. */ + send('%'); + ret++; + continue; + } + flags = 0; + is_long = False; + width = 0; /* length of the field. */ + if (format[i] == '(') { + flags |= VG_MSG_PAREN; + i++; + } + /* If ',' follows '%', commas will be inserted. */ + if (format[i] == ',') { + flags |= VG_MSG_COMMA; + i++; + } + /* If '-' follows '%', justify on the left. */ + if (format[i] == '-') { + flags |= VG_MSG_LJUSTIFY; + i++; + } + /* If '0' follows '%', pads will be inserted. */ + if (format[i] == '0') { + flags |= VG_MSG_ZJUSTIFY; + i++; + } + /* Compute the field length. */ + while (format[i] >= '0' && format[i] <= '9') { + width *= 10; + width += format[i++] - '0'; + } + while (format[i] == 'l') { + i++; + is_long = True; + } + + switch (format[i]) { + case 'd': /* %d */ + flags |= VG_MSG_SIGNED; + if (is_long) + ret += myvprintf_int64(send, flags, 10, width, + (ULong)(va_arg (vargs, Long))); + else + ret += myvprintf_int64(send, flags, 10, width, + (ULong)(va_arg (vargs, Int))); + break; + case 'u': /* %u */ + if (is_long) + ret += myvprintf_int64(send, flags, 10, width, + (ULong)(va_arg (vargs, ULong))); + else + ret += myvprintf_int64(send, flags, 10, width, + (ULong)(va_arg (vargs, UInt))); + break; + case 'p': /* %p */ + ret += 2; + send('0'); + send('x'); + ret += myvprintf_int64(send, flags, 16, width, + (ULong)((HWord)va_arg (vargs, void *))); + break; + case 'x': /* %x */ + if (is_long) + ret += myvprintf_int64(send, flags, 16, width, + (ULong)(va_arg (vargs, ULong))); + else + ret += myvprintf_int64(send, flags, 16, width, + (ULong)(va_arg (vargs, UInt))); + break; + case 'c': /* %c */ + ret++; + send((va_arg (vargs, int))); + break; + case 's': case 'S': { /* %s */ + char *str = va_arg (vargs, char *); + if (str == (char*) 0) str = "(null)"; + ret += myvprintf_str(send, flags, width, str, + (format[i]=='S')); + break; + } +# if 0 + case 'y': { /* %y - print symbol */ + Char buf[100]; + Char *cp = buf; + Addr a = va_arg(vargs, Addr); + + if (flags & VG_MSG_PAREN) + *cp++ = '('; + if (VG_(get_fnname_w_offset)(a, cp, sizeof(buf)-4)) { + if (flags & VG_MSG_PAREN) { + cp += VG_(strlen)(cp); + *cp++ = ')'; + *cp = '\0'; + } + ret += myvprintf_str(send, flags, width, buf, 0); + } + break; + } +# endif + default: + break; + } + } + return ret; +} + + +/* A general replacement for printf(). Note that only low-level + debugging info should be sent via here. The official route is to + to use vg_message(). This interface is deprecated. +*/ +/* XXX re 930: make the buffer just to small (by 1 byte) to be OK + for this particular run. */ +static HChar myprintf_buf[1000 -930]; +static Int n_myprintf_buf; + +static void add_to_myprintf_buf ( HChar c ) +{ + if (c == '\n' || n_myprintf_buf >= 1000-10 /*paranoia*/ ) { + (*vex_log_bytes)( myprintf_buf, vex_strlen(myprintf_buf) ); + n_myprintf_buf = 0; + myprintf_buf[n_myprintf_buf] = 0; + } + myprintf_buf[n_myprintf_buf++] = c; + myprintf_buf[n_myprintf_buf] = 0; +} + +static UInt vex_printf ( const char *format, ... ) +{ + UInt ret; + va_list vargs; + va_start(vargs,format); + + n_myprintf_buf = 0; + myprintf_buf[n_myprintf_buf] = 0; + ret = vprintf_wrk ( add_to_myprintf_buf, format, vargs ); + + if (n_myprintf_buf > 0) { + (*vex_log_bytes)( myprintf_buf, n_myprintf_buf ); + } + + va_end(vargs); + + return ret; +} + +/*---------------------------------------------------------------*/ +/*--- end vex_util.c ---*/ +/*---------------------------------------------------------------*/ + + +///////////////////////////////////////////////////////////////////// +///////////////////////////////////////////////////////////////////// +///////////////////////////////////////////////////////////////////// +///////////////////////////////////////////////////////////////////// + + +/*-------------------------------------------------------------*/ +/*--- Decompression machinery ---*/ +/*--- decompress.c ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + + + + +/*---------------------------------------------------*/ +static +void makeMaps_d ( DState* s ) +{ + Int32 i; + s->nInUse = 0; + for (i = 0; i < 256; i++) + if (s->inUse[i]) { + s->seqToUnseq[s->nInUse] = i; + s->nInUse++; + } +} + + +/*---------------------------------------------------*/ +#define RETURN(rrr) \ + { retVal = rrr; goto save_state_and_return; }; + +#define GET_BITS(lll,vvv,nnn) \ + case lll: s->state = lll; \ + while (True) { \ + if (s->bsLive >= nnn) { \ + UInt32 v; \ + v = (s->bsBuff >> \ + (s->bsLive-nnn)) & ((1 << nnn)-1); \ + s->bsLive -= nnn; \ + vvv = v; \ + break; \ + } \ + if (s->strm->avail_in == 0) RETURN(BZ_OK); \ + s->bsBuff \ + = (s->bsBuff << 8) | \ + ((UInt32) \ + (*((UChar*)(s->strm->next_in)))); \ + s->bsLive += 8; \ + s->strm->next_in++; \ + s->strm->avail_in--; \ + s->strm->total_in_lo32++; \ + if (s->strm->total_in_lo32 == 0) \ + s->strm->total_in_hi32++; \ + } + +#define GET_UCHAR(lll,uuu) \ + GET_BITS(lll,uuu,8) + +#define GET_BIT(lll,uuu) \ + GET_BITS(lll,uuu,1) + +/*---------------------------------------------------*/ +#define GET_MTF_VAL(label1,label2,lval) \ +{ \ + if (groupPos == 0) { \ + groupNo++; \ + if (groupNo >= nSelectors) \ + RETURN(BZ_DATA_ERROR); \ + groupPos = BZ_G_SIZE; \ + gSel = s->selector[groupNo]; \ + gMinlen = s->minLens[gSel]; \ + gLimit = &(s->limit[gSel][0]); \ + gPerm = &(s->perm[gSel][0]); \ + gBase = &(s->base[gSel][0]); \ + } \ + groupPos--; \ + zn = gMinlen; \ + GET_BITS(label1, zvec, zn); \ + while (1) { \ + if (zn > 20 /* the longest code */) \ + RETURN(BZ_DATA_ERROR); \ + if (zvec <= gLimit[zn]) break; \ + zn++; \ + GET_BIT(label2, zj); \ + zvec = (zvec << 1) | zj; \ + }; \ + if (zvec - gBase[zn] < 0 \ + || zvec - gBase[zn] >= BZ_MAX_ALPHA_SIZE) \ + RETURN(BZ_DATA_ERROR); \ + lval = gPerm[zvec - gBase[zn]]; \ +} + + + +/*---------------------------------------------------*/ +__inline__ Int32 BZ2_indexIntoF ( Int32 indx, Int32 *cftab ) +{ + Int32 nb, na, mid; + nb = 0; + na = 256; + do { + mid = (nb + na) >> 1; + if (indx >= cftab[mid]) nb = mid; else na = mid; + } + while (na - nb != 1); + return nb; +} + +/*---------------------------------------------------*/ +Int32 BZ2_decompress ( DState* s ) +{ + UChar uc; + Int32 retVal; + Int32 minLen, maxLen; + bz_stream* strm = s->strm; + + /* stuff that needs to be saved/restored */ + Int32 i; + Int32 j; + Int32 t; + Int32 alphaSize; + Int32 nGroups; + Int32 nSelectors; + Int32 EOB; + Int32 groupNo; + Int32 groupPos; + Int32 nextSym; + Int32 nblockMAX; + Int32 nblock; + Int32 es; + Int32 N; + Int32 curr; + Int32 zt; + Int32 zn; + Int32 zvec; + Int32 zj; + Int32 gSel; + Int32 gMinlen; + Int32* gLimit; + Int32* gBase; + Int32* gPerm; + + if (s->state == BZ_X_MAGIC_1) { + /*initialise the save area*/ + s->save_i = 0; + s->save_j = 0; + s->save_t = 0; + s->save_alphaSize = 0; + s->save_nGroups = 0; + s->save_nSelectors = 0; + s->save_EOB = 0; + s->save_groupNo = 0; + s->save_groupPos = 0; + s->save_nextSym = 0; + s->save_nblockMAX = 0; + s->save_nblock = 0; + s->save_es = 0; + s->save_N = 0; + s->save_curr = 0; + s->save_zt = 0; + s->save_zn = 0; + s->save_zvec = 0; + s->save_zj = 0; + s->save_gSel = 0; + s->save_gMinlen = 0; + s->save_gLimit = NULL; + s->save_gBase = NULL; + s->save_gPerm = NULL; + } + + /*restore from the save area*/ + i = s->save_i; + j = s->save_j; + t = s->save_t; + alphaSize = s->save_alphaSize; + nGroups = s->save_nGroups; + nSelectors = s->save_nSelectors; + EOB = s->save_EOB; + groupNo = s->save_groupNo; + groupPos = s->save_groupPos; + nextSym = s->save_nextSym; + nblockMAX = s->save_nblockMAX; + nblock = s->save_nblock; + es = s->save_es; + N = s->save_N; + curr = s->save_curr; + zt = s->save_zt; + zn = s->save_zn; + zvec = s->save_zvec; + zj = s->save_zj; + gSel = s->save_gSel; + gMinlen = s->save_gMinlen; + gLimit = s->save_gLimit; + gBase = s->save_gBase; + gPerm = s->save_gPerm; + + retVal = BZ_OK; + + switch (s->state) { + + GET_UCHAR(BZ_X_MAGIC_1, uc); + if (uc != BZ_HDR_B) RETURN(BZ_DATA_ERROR_MAGIC); + + GET_UCHAR(BZ_X_MAGIC_2, uc); + if (uc != BZ_HDR_Z) RETURN(BZ_DATA_ERROR_MAGIC); + + GET_UCHAR(BZ_X_MAGIC_3, uc) + if (uc != BZ_HDR_h) RETURN(BZ_DATA_ERROR_MAGIC); + + GET_BITS(BZ_X_MAGIC_4, s->blockSize100k, 8) + if (s->blockSize100k < (BZ_HDR_0 + 1) || + s->blockSize100k > (BZ_HDR_0 + 9)) RETURN(BZ_DATA_ERROR_MAGIC); + s->blockSize100k -= BZ_HDR_0; + + if (s->smallDecompress) { + s->ll16 = BZALLOC( s->blockSize100k * 100000 * sizeof(UInt16) ); + s->ll4 = BZALLOC( + ((1 + s->blockSize100k * 100000) >> 1) * sizeof(UChar) + ); + if (s->ll16 == NULL || s->ll4 == NULL) RETURN(BZ_MEM_ERROR); + } else { + s->tt = BZALLOC( s->blockSize100k * 100000 * sizeof(Int32) ); + if (s->tt == NULL) RETURN(BZ_MEM_ERROR); + } + + GET_UCHAR(BZ_X_BLKHDR_1, uc); + + if (uc == 0x17) goto endhdr_2; + if (uc != 0x31) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_BLKHDR_2, uc); + if (uc != 0x41) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_BLKHDR_3, uc); + if (uc != 0x59) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_BLKHDR_4, uc); + if (uc != 0x26) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_BLKHDR_5, uc); + if (uc != 0x53) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_BLKHDR_6, uc); + if (uc != 0x59) RETURN(BZ_DATA_ERROR); + + s->currBlockNo++; + if (s->verbosity >= 2) + VPrintf1 ( "\n [%d: huff+mtf ", s->currBlockNo ); + + s->storedBlockCRC = 0; + GET_UCHAR(BZ_X_BCRC_1, uc); + s->storedBlockCRC = (s->storedBlockCRC << 8) | ((UInt32)uc); + GET_UCHAR(BZ_X_BCRC_2, uc); + s->storedBlockCRC = (s->storedBlockCRC << 8) | ((UInt32)uc); + GET_UCHAR(BZ_X_BCRC_3, uc); + s->storedBlockCRC = (s->storedBlockCRC << 8) | ((UInt32)uc); + GET_UCHAR(BZ_X_BCRC_4, uc); + s->storedBlockCRC = (s->storedBlockCRC << 8) | ((UInt32)uc); + + GET_BITS(BZ_X_RANDBIT, s->blockRandomised, 1); + + s->origPtr = 0; + GET_UCHAR(BZ_X_ORIGPTR_1, uc); + s->origPtr = (s->origPtr << 8) | ((Int32)uc); + GET_UCHAR(BZ_X_ORIGPTR_2, uc); + s->origPtr = (s->origPtr << 8) | ((Int32)uc); + GET_UCHAR(BZ_X_ORIGPTR_3, uc); + s->origPtr = (s->origPtr << 8) | ((Int32)uc); + + if (s->origPtr < 0) + RETURN(BZ_DATA_ERROR); + if (s->origPtr > 10 + 100000*s->blockSize100k) + RETURN(BZ_DATA_ERROR); + + /*--- Receive the mapping table ---*/ + for (i = 0; i < 16; i++) { + GET_BIT(BZ_X_MAPPING_1, uc); + if (uc == 1) + s->inUse16[i] = True; else + s->inUse16[i] = False; + } + + for (i = 0; i < 256; i++) s->inUse[i] = False; + + for (i = 0; i < 16; i++) + if (s->inUse16[i]) + for (j = 0; j < 16; j++) { + GET_BIT(BZ_X_MAPPING_2, uc); + if (uc == 1) s->inUse[i * 16 + j] = True; + } + makeMaps_d ( s ); + if (s->nInUse == 0) RETURN(BZ_DATA_ERROR); + alphaSize = s->nInUse+2; + + /*--- Now the selectors ---*/ + GET_BITS(BZ_X_SELECTOR_1, nGroups, 3); + if (nGroups < 2 || nGroups > 6) RETURN(BZ_DATA_ERROR); + GET_BITS(BZ_X_SELECTOR_2, nSelectors, 15); + if (nSelectors < 1) RETURN(BZ_DATA_ERROR); + for (i = 0; i < nSelectors; i++) { + j = 0; + while (True) { + GET_BIT(BZ_X_SELECTOR_3, uc); + if (uc == 0) break; + j++; + if (j >= nGroups) RETURN(BZ_DATA_ERROR); + } + s->selectorMtf[i] = j; + } + + /*--- Undo the MTF values for the selectors. ---*/ + { + UChar pos[BZ_N_GROUPS], tmp, v; + for (v = 0; v < nGroups; v++) pos[v] = v; + + for (i = 0; i < nSelectors; i++) { + v = s->selectorMtf[i]; + tmp = pos[v]; + while (v > 0) { pos[v] = pos[v-1]; v--; } + pos[0] = tmp; + s->selector[i] = tmp; + } + } + + /*--- Now the coding tables ---*/ + for (t = 0; t < nGroups; t++) { + GET_BITS(BZ_X_CODING_1, curr, 5); + for (i = 0; i < alphaSize; i++) { + while (True) { + if (curr < 1 || curr > 20) RETURN(BZ_DATA_ERROR); + GET_BIT(BZ_X_CODING_2, uc); + if (uc == 0) break; + GET_BIT(BZ_X_CODING_3, uc); + if (uc == 0) curr++; else curr--; + } + s->len[t][i] = curr; + } + } + + /*--- Create the Huffman decoding tables ---*/ + for (t = 0; t < nGroups; t++) { + minLen = 32; + maxLen = 0; + for (i = 0; i < alphaSize; i++) { + if (s->len[t][i] > maxLen) maxLen = s->len[t][i]; + if (s->len[t][i] < minLen) minLen = s->len[t][i]; + } + BZ2_hbCreateDecodeTables ( + &(s->limit[t][0]), + &(s->base[t][0]), + &(s->perm[t][0]), + &(s->len[t][0]), + minLen, maxLen, alphaSize + ); + s->minLens[t] = minLen; + } + + /*--- Now the MTF values ---*/ + + EOB = s->nInUse+1; + nblockMAX = 100000 * s->blockSize100k; + groupNo = -1; + groupPos = 0; + + for (i = 0; i <= 255; i++) s->unzftab[i] = 0; + + /*-- MTF init --*/ + { + Int32 ii, jj, kk; + kk = MTFA_SIZE-1; + for (ii = 256 / MTFL_SIZE - 1; ii >= 0; ii--) { + for (jj = MTFL_SIZE-1; jj >= 0; jj--) { + s->mtfa[kk] = (UChar)(ii * MTFL_SIZE + jj); + kk--; + } + s->mtfbase[ii] = kk + 1; + } + } + /*-- end MTF init --*/ + + nblock = 0; + GET_MTF_VAL(BZ_X_MTF_1, BZ_X_MTF_2, nextSym); + + while (True) { + + if (nextSym == EOB) break; + + if (nextSym == BZ_RUNA || nextSym == BZ_RUNB) { + + es = -1; + N = 1; + do { + if (nextSym == BZ_RUNA) es = es + (0+1) * N; else + if (nextSym == BZ_RUNB) es = es + (1+1) * N; + N = N * 2; + GET_MTF_VAL(BZ_X_MTF_3, BZ_X_MTF_4, nextSym); + } + while (nextSym == BZ_RUNA || nextSym == BZ_RUNB); + + es++; + uc = s->seqToUnseq[ s->mtfa[s->mtfbase[0]] ]; + s->unzftab[uc] += es; + + if (s->smallDecompress) + while (es > 0) { + if (nblock >= nblockMAX) RETURN(BZ_DATA_ERROR); + s->ll16[nblock] = (UInt16)uc; + nblock++; + es--; + } + else + while (es > 0) { + if (nblock >= nblockMAX) RETURN(BZ_DATA_ERROR); + s->tt[nblock] = (UInt32)uc; + nblock++; + es--; + }; + + continue; + + } else { + + if (nblock >= nblockMAX) RETURN(BZ_DATA_ERROR); + + /*-- uc = MTF ( nextSym-1 ) --*/ + { + Int32 ii, jj, kk, pp, lno, off; + UInt32 nn; + nn = (UInt32)(nextSym - 1); + + if (nn < MTFL_SIZE) { + /* avoid general-case expense */ + pp = s->mtfbase[0]; + uc = s->mtfa[pp+nn]; + while (nn > 3) { + Int32 z = pp+nn; + s->mtfa[(z) ] = s->mtfa[(z)-1]; + s->mtfa[(z)-1] = s->mtfa[(z)-2]; + s->mtfa[(z)-2] = s->mtfa[(z)-3]; + s->mtfa[(z)-3] = s->mtfa[(z)-4]; + nn -= 4; + } + while (nn > 0) { + s->mtfa[(pp+nn)] = s->mtfa[(pp+nn)-1]; nn--; + }; + s->mtfa[pp] = uc; + } else { + /* general case */ + lno = nn / MTFL_SIZE; + off = nn % MTFL_SIZE; + pp = s->mtfbase[lno] + off; + uc = s->mtfa[pp]; + while (pp > s->mtfbase[lno]) { + s->mtfa[pp] = s->mtfa[pp-1]; pp--; + }; + s->mtfbase[lno]++; + while (lno > 0) { + s->mtfbase[lno]--; + s->mtfa[s->mtfbase[lno]] + = s->mtfa[s->mtfbase[lno-1] + MTFL_SIZE - 1]; + lno--; + } + s->mtfbase[0]--; + s->mtfa[s->mtfbase[0]] = uc; + if (s->mtfbase[0] == 0) { + kk = MTFA_SIZE-1; + for (ii = 256 / MTFL_SIZE-1; ii >= 0; ii--) { + for (jj = MTFL_SIZE-1; jj >= 0; jj--) { + s->mtfa[kk] = s->mtfa[s->mtfbase[ii] + jj]; + kk--; + } + s->mtfbase[ii] = kk + 1; + } + } + } + } + /*-- end uc = MTF ( nextSym-1 ) --*/ + + s->unzftab[s->seqToUnseq[uc]]++; + if (s->smallDecompress) + s->ll16[nblock] = (UInt16)(s->seqToUnseq[uc]); else + s->tt[nblock] = (UInt32)(s->seqToUnseq[uc]); + nblock++; + + GET_MTF_VAL(BZ_X_MTF_5, BZ_X_MTF_6, nextSym); + continue; + } + } + + /* Now we know what nblock is, we can do a better sanity + check on s->origPtr. + */ + if (s->origPtr < 0 || s->origPtr >= nblock) + RETURN(BZ_DATA_ERROR); + + /*-- Set up cftab to facilitate generation of T^(-1) --*/ + s->cftab[0] = 0; + for (i = 1; i <= 256; i++) s->cftab[i] = s->unzftab[i-1]; + for (i = 1; i <= 256; i++) s->cftab[i] += s->cftab[i-1]; + for (i = 0; i <= 256; i++) { + if (s->cftab[i] < 0 || s->cftab[i] > nblock) { + /* s->cftab[i] can legitimately be == nblock */ + RETURN(BZ_DATA_ERROR); + } + } + + s->state_out_len = 0; + s->state_out_ch = 0; + BZ_INITIALISE_CRC ( s->calculatedBlockCRC ); + s->state = BZ_X_OUTPUT; + if (s->verbosity >= 2) VPrintf0 ( "rt+rld" ); + + if (s->smallDecompress) { + + /*-- Make a copy of cftab, used in generation of T --*/ + for (i = 0; i <= 256; i++) s->cftabCopy[i] = s->cftab[i]; + + /*-- compute the T vector --*/ + for (i = 0; i < nblock; i++) { + uc = (UChar)(s->ll16[i]); + SET_LL(i, s->cftabCopy[uc]); + s->cftabCopy[uc]++; + } + + /*-- Compute T^(-1) by pointer reversal on T --*/ + i = s->origPtr; + j = GET_LL(i); + do { + Int32 tmp = GET_LL(j); + SET_LL(j, i); + i = j; + j = tmp; + } + while (i != s->origPtr); + + s->tPos = s->origPtr; + s->nblock_used = 0; + if (s->blockRandomised) { + BZ_RAND_INIT_MASK; + BZ_GET_SMALL(s->k0); s->nblock_used++; + BZ_RAND_UPD_MASK; s->k0 ^= BZ_RAND_MASK; + } else { + BZ_GET_SMALL(s->k0); s->nblock_used++; + } + + } else { + + /*-- compute the T^(-1) vector --*/ + for (i = 0; i < nblock; i++) { + uc = (UChar)(s->tt[i] & 0xff); + s->tt[s->cftab[uc]] |= (i << 8); + s->cftab[uc]++; + } + + s->tPos = s->tt[s->origPtr] >> 8; + s->nblock_used = 0; + if (s->blockRandomised) { + BZ_RAND_INIT_MASK; + BZ_GET_FAST(s->k0); s->nblock_used++; + BZ_RAND_UPD_MASK; s->k0 ^= BZ_RAND_MASK; + } else { + BZ_GET_FAST(s->k0); s->nblock_used++; + } + + } + + RETURN(BZ_OK); + + + + endhdr_2: + + GET_UCHAR(BZ_X_ENDHDR_2, uc); + if (uc != 0x72) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_ENDHDR_3, uc); + if (uc != 0x45) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_ENDHDR_4, uc); + if (uc != 0x38) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_ENDHDR_5, uc); + if (uc != 0x50) RETURN(BZ_DATA_ERROR); + GET_UCHAR(BZ_X_ENDHDR_6, uc); + if (uc != 0x90) RETURN(BZ_DATA_ERROR); + + s->storedCombinedCRC = 0; + GET_UCHAR(BZ_X_CCRC_1, uc); + s->storedCombinedCRC = (s->storedCombinedCRC << 8) | ((UInt32)uc); + GET_UCHAR(BZ_X_CCRC_2, uc); + s->storedCombinedCRC = (s->storedCombinedCRC << 8) | ((UInt32)uc); + GET_UCHAR(BZ_X_CCRC_3, uc); + s->storedCombinedCRC = (s->storedCombinedCRC << 8) | ((UInt32)uc); + GET_UCHAR(BZ_X_CCRC_4, uc); + s->storedCombinedCRC = (s->storedCombinedCRC << 8) | ((UInt32)uc); + + s->state = BZ_X_IDLE; + RETURN(BZ_STREAM_END); + + default: AssertH ( False, 4001 ); + } + + AssertH ( False, 4002 ); + + save_state_and_return: + + s->save_i = i; + s->save_j = j; + s->save_t = t; + s->save_alphaSize = alphaSize; + s->save_nGroups = nGroups; + s->save_nSelectors = nSelectors; + s->save_EOB = EOB; + s->save_groupNo = groupNo; + s->save_groupPos = groupPos; + s->save_nextSym = nextSym; + s->save_nblockMAX = nblockMAX; + s->save_nblock = nblock; + s->save_es = es; + s->save_N = N; + s->save_curr = curr; + s->save_zt = zt; + s->save_zn = zn; + s->save_zvec = zvec; + s->save_zj = zj; + s->save_gSel = gSel; + s->save_gMinlen = gMinlen; + s->save_gLimit = gLimit; + s->save_gBase = gBase; + s->save_gPerm = gPerm; + + return retVal; +} + + +/*-------------------------------------------------------------*/ +/*--- end decompress.c ---*/ +/*-------------------------------------------------------------*/ + +/*-------------------------------------------------------------*/ +/*--- Block sorting machinery ---*/ +/*--- blocksort.c ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. + + To get some idea how the block sorting algorithms in this file + work, read my paper + On the Performance of BWT Sorting Algorithms + in Proceedings of the IEEE Data Compression Conference 2000, + Snowbird, Utah, USA, 27-30 March 2000. The main sort in this + file implements the algorithm called cache in the paper. +--*/ + + + +/*---------------------------------------------*/ +/*--- Fallback O(N log(N)^2) sorting ---*/ +/*--- algorithm, for repetitive blocks ---*/ +/*---------------------------------------------*/ + +/*---------------------------------------------*/ +static +__inline__ +void fallbackSimpleSort ( UInt32* fmap, + UInt32* eclass, + Int32 lo, + Int32 hi ) +{ + Int32 i, j, tmp; + UInt32 ec_tmp; + + if (lo == hi) return; + + if (hi - lo > 3) { + for ( i = hi-4; i >= lo; i-- ) { + tmp = fmap[i]; + ec_tmp = eclass[tmp]; + for ( j = i+4; j <= hi && ec_tmp > eclass[fmap[j]]; j += 4 ) + fmap[j-4] = fmap[j]; + fmap[j-4] = tmp; + } + } + + for ( i = hi-1; i >= lo; i-- ) { + tmp = fmap[i]; + ec_tmp = eclass[tmp]; + for ( j = i+1; j <= hi && ec_tmp > eclass[fmap[j]]; j++ ) + fmap[j-1] = fmap[j]; + fmap[j-1] = tmp; + } +} + + +/*---------------------------------------------*/ +#define fswap(zz1, zz2) \ + { Int32 zztmp = zz1; zz1 = zz2; zz2 = zztmp; } + +#define fvswap(zzp1, zzp2, zzn) \ +{ \ + Int32 yyp1 = (zzp1); \ + Int32 yyp2 = (zzp2); \ + Int32 yyn = (zzn); \ + while (yyn > 0) { \ + fswap(fmap[yyp1], fmap[yyp2]); \ + yyp1++; yyp2++; yyn--; \ + } \ +} + + +#define fmin(a,b) ((a) < (b)) ? (a) : (b) + +#define fpush(lz,hz) { stackLo[sp] = lz; \ + stackHi[sp] = hz; \ + sp++; } + +#define fpop(lz,hz) { sp--; \ + lz = stackLo[sp]; \ + hz = stackHi[sp]; } + +#define FALLBACK_QSORT_SMALL_THRESH 10 +#define FALLBACK_QSORT_STACK_SIZE 100 + + +static +void fallbackQSort3 ( UInt32* fmap, + UInt32* eclass, + Int32 loSt, + Int32 hiSt ) +{ + Int32 unLo, unHi, ltLo, gtHi, n, m; + Int32 sp, lo, hi; + UInt32 med, r, r3; + Int32 stackLo[FALLBACK_QSORT_STACK_SIZE]; + Int32 stackHi[FALLBACK_QSORT_STACK_SIZE]; + + r = 0; + + sp = 0; + fpush ( loSt, hiSt ); + + while (sp > 0) { + + AssertH ( sp < FALLBACK_QSORT_STACK_SIZE, 1004 ); + + fpop ( lo, hi ); + if (hi - lo < FALLBACK_QSORT_SMALL_THRESH) { + fallbackSimpleSort ( fmap, eclass, lo, hi ); + continue; + } + + /* Random partitioning. Median of 3 sometimes fails to + avoid bad cases. Median of 9 seems to help but + looks rather expensive. This too seems to work but + is cheaper. Guidance for the magic constants + 7621 and 32768 is taken from Sedgewick's algorithms + book, chapter 35. + */ + r = ((r * 7621) + 1) % 32768; + r3 = r % 3; + if (r3 == 0) med = eclass[fmap[lo]]; else + if (r3 == 1) med = eclass[fmap[(lo+hi)>>1]]; else + med = eclass[fmap[hi]]; + + unLo = ltLo = lo; + unHi = gtHi = hi; + + while (1) { + while (1) { + if (unLo > unHi) break; + n = (Int32)eclass[fmap[unLo]] - (Int32)med; + if (n == 0) { + fswap(fmap[unLo], fmap[ltLo]); + ltLo++; unLo++; + continue; + }; + if (n > 0) break; + unLo++; + } + while (1) { + if (unLo > unHi) break; + n = (Int32)eclass[fmap[unHi]] - (Int32)med; + if (n == 0) { + fswap(fmap[unHi], fmap[gtHi]); + gtHi--; unHi--; + continue; + }; + if (n < 0) break; + unHi--; + } + if (unLo > unHi) break; + fswap(fmap[unLo], fmap[unHi]); unLo++; unHi--; + } + + AssertD ( unHi == unLo-1, "fallbackQSort3(2)" ); + + if (gtHi < ltLo) continue; + + n = fmin(ltLo-lo, unLo-ltLo); fvswap(lo, unLo-n, n); + m = fmin(hi-gtHi, gtHi-unHi); fvswap(unLo, hi-m+1, m); + + n = lo + unLo - ltLo - 1; + m = hi - (gtHi - unHi) + 1; + + if (n - lo > hi - m) { + fpush ( lo, n ); + fpush ( m, hi ); + } else { + fpush ( m, hi ); + fpush ( lo, n ); + } + } +} + +#undef fmin +#undef fpush +#undef fpop +#undef fswap +#undef fvswap +#undef FALLBACK_QSORT_SMALL_THRESH +#undef FALLBACK_QSORT_STACK_SIZE + + +/*---------------------------------------------*/ +/* Pre: + nblock > 0 + eclass exists for [0 .. nblock-1] + ((UChar*)eclass) [0 .. nblock-1] holds block + ptr exists for [0 .. nblock-1] + + Post: + ((UChar*)eclass) [0 .. nblock-1] holds block + All other areas of eclass destroyed + fmap [0 .. nblock-1] holds sorted order + bhtab [ 0 .. 2+(nblock/32) ] destroyed +*/ + +#define SET_BH(zz) bhtab[(zz) >> 5] |= (1 << ((zz) & 31)) +#define CLEAR_BH(zz) bhtab[(zz) >> 5] &= ~(1 << ((zz) & 31)) +#define ISSET_BH(zz) (bhtab[(zz) >> 5] & (1 << ((zz) & 31))) +#define WORD_BH(zz) bhtab[(zz) >> 5] +#define UNALIGNED_BH(zz) ((zz) & 0x01f) + +static +void fallbackSort ( UInt32* fmap, + UInt32* eclass, + UInt32* bhtab, + Int32 nblock, + Int32 verb ) +{ + Int32 ftab[257]; + Int32 ftabCopy[256]; + Int32 H, i, j, k, l, r, cc, cc1; + Int32 nNotDone; + Int32 nBhtab; + UChar* eclass8 = (UChar*)eclass; + + /*-- + Initial 1-char radix sort to generate + initial fmap and initial BH bits. + --*/ + if (verb >= 4) + VPrintf0 ( " bucket sorting ...\n" ); + for (i = 0; i < 257; i++) ftab[i] = 0; + for (i = 0; i < nblock; i++) ftab[eclass8[i]]++; + for (i = 0; i < 256; i++) ftabCopy[i] = ftab[i]; + for (i = 1; i < 257; i++) ftab[i] += ftab[i-1]; + + for (i = 0; i < nblock; i++) { + j = eclass8[i]; + k = ftab[j] - 1; + ftab[j] = k; + fmap[k] = i; + } + + nBhtab = 2 + (nblock / 32); + for (i = 0; i < nBhtab; i++) bhtab[i] = 0; + for (i = 0; i < 256; i++) SET_BH(ftab[i]); + + /*-- + Inductively refine the buckets. Kind-of an + "exponential radix sort" (!), inspired by the + Manber-Myers suffix array construction algorithm. + --*/ + + /*-- set sentinel bits for block-end detection --*/ + for (i = 0; i < 32; i++) { + SET_BH(nblock + 2*i); + CLEAR_BH(nblock + 2*i + 1); + } + + /*-- the log(N) loop --*/ + H = 1; + while (1) { + + if (verb >= 4) + VPrintf1 ( " depth %6d has ", H ); + + j = 0; + for (i = 0; i < nblock; i++) { + if (ISSET_BH(i)) j = i; + k = fmap[i] - H; if (k < 0) k += nblock; + eclass[k] = j; + } + + nNotDone = 0; + r = -1; + while (1) { + + /*-- find the next non-singleton bucket --*/ + k = r + 1; + while (ISSET_BH(k) && UNALIGNED_BH(k)) k++; + if (ISSET_BH(k)) { + while (WORD_BH(k) == 0xffffffff) k += 32; + while (ISSET_BH(k)) k++; + } + l = k - 1; + if (l >= nblock) break; + while (!ISSET_BH(k) && UNALIGNED_BH(k)) k++; + if (!ISSET_BH(k)) { + while (WORD_BH(k) == 0x00000000) k += 32; + while (!ISSET_BH(k)) k++; + } + r = k - 1; + if (r >= nblock) break; + + /*-- now [l, r] bracket current bucket --*/ + if (r > l) { + nNotDone += (r - l + 1); + fallbackQSort3 ( fmap, eclass, l, r ); + + /*-- scan bucket and generate header bits-- */ + cc = -1; + for (i = l; i <= r; i++) { + cc1 = eclass[fmap[i]]; + if (cc != cc1) { SET_BH(i); cc = cc1; }; + } + } + } + + if (verb >= 4) + VPrintf1 ( "%6d unresolved strings\n", nNotDone ); + + H *= 2; + if (H > nblock || nNotDone == 0) break; + } + + /*-- + Reconstruct the original block in + eclass8 [0 .. nblock-1], since the + previous phase destroyed it. + --*/ + if (verb >= 4) + VPrintf0 ( " reconstructing block ...\n" ); + j = 0; + for (i = 0; i < nblock; i++) { + while (ftabCopy[j] == 0) j++; + ftabCopy[j]--; + eclass8[fmap[i]] = (UChar)j; + } + AssertH ( j < 256, 1005 ); +} + +#undef SET_BH +#undef CLEAR_BH +#undef ISSET_BH +#undef WORD_BH +#undef UNALIGNED_BH + + +/*---------------------------------------------*/ +/*--- The main, O(N^2 log(N)) sorting ---*/ +/*--- algorithm. Faster for "normal" ---*/ +/*--- non-repetitive blocks. ---*/ +/*---------------------------------------------*/ + +/*---------------------------------------------*/ +static +__inline__ +Bool mainGtU ( UInt32 i1, + UInt32 i2, + UChar* block, + UInt16* quadrant, + UInt32 nblock, + Int32* budget ) +{ + Int32 k; + UChar c1, c2; + UInt16 s1, s2; + + AssertD ( i1 != i2, "mainGtU" ); + /* 1 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 2 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 3 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 4 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 5 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 6 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 7 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 8 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 9 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 10 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 11 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + /* 12 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + i1++; i2++; + + k = nblock + 8; + + do { + /* 1 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + /* 2 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + /* 3 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + /* 4 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + /* 5 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + /* 6 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + /* 7 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + /* 8 */ + c1 = block[i1]; c2 = block[i2]; + if (c1 != c2) return (c1 > c2); + s1 = quadrant[i1]; s2 = quadrant[i2]; + if (s1 != s2) return (s1 > s2); + i1++; i2++; + + if (i1 >= nblock) i1 -= nblock; + if (i2 >= nblock) i2 -= nblock; + + k -= 8; + (*budget)--; + } + while (k >= 0); + + return False; +} + + +/*---------------------------------------------*/ +/*-- + Knuth's increments seem to work better + than Incerpi-Sedgewick here. Possibly + because the number of elems to sort is + usually small, typically <= 20. +--*/ +static +Int32 incs[14] = { 1, 4, 13, 40, 121, 364, 1093, 3280, + 9841, 29524, 88573, 265720, + 797161, 2391484 }; + +static +void mainSimpleSort ( UInt32* ptr, + UChar* block, + UInt16* quadrant, + Int32 nblock, + Int32 lo, + Int32 hi, + Int32 d, + Int32* budget ) +{ + Int32 i, j, h, bigN, hp; + UInt32 v; + + bigN = hi - lo + 1; + if (bigN < 2) return; + + hp = 0; + while (incs[hp] < bigN) hp++; + hp--; + + for (; hp >= 0; hp--) { + h = incs[hp]; + + i = lo + h; + while (True) { + + /*-- copy 1 --*/ + if (i > hi) break; + v = ptr[i]; + j = i; + while ( mainGtU ( + ptr[j-h]+d, v+d, block, quadrant, nblock, budget + ) ) { + ptr[j] = ptr[j-h]; + j = j - h; + if (j <= (lo + h - 1)) break; + } + ptr[j] = v; + i++; + + /*-- copy 2 --*/ + if (i > hi) break; + v = ptr[i]; + j = i; + while ( mainGtU ( + ptr[j-h]+d, v+d, block, quadrant, nblock, budget + ) ) { + ptr[j] = ptr[j-h]; + j = j - h; + if (j <= (lo + h - 1)) break; + } + ptr[j] = v; + i++; + + /*-- copy 3 --*/ + if (i > hi) break; + v = ptr[i]; + j = i; + while ( mainGtU ( + ptr[j-h]+d, v+d, block, quadrant, nblock, budget + ) ) { + ptr[j] = ptr[j-h]; + j = j - h; + if (j <= (lo + h - 1)) break; + } + ptr[j] = v; + i++; + + if (*budget < 0) return; + } + } +} + + +/*---------------------------------------------*/ +/*-- + The following is an implementation of + an elegant 3-way quicksort for strings, + described in a paper "Fast Algorithms for + Sorting and Searching Strings", by Robert + Sedgewick and Jon L. Bentley. +--*/ + +#define mswap(zz1, zz2) \ + { Int32 zztmp = zz1; zz1 = zz2; zz2 = zztmp; } + +#define mvswap(zzp1, zzp2, zzn) \ +{ \ + Int32 yyp1 = (zzp1); \ + Int32 yyp2 = (zzp2); \ + Int32 yyn = (zzn); \ + while (yyn > 0) { \ + mswap(ptr[yyp1], ptr[yyp2]); \ + yyp1++; yyp2++; yyn--; \ + } \ +} + +static +__inline__ +UChar mmed3 ( UChar a, UChar b, UChar c ) +{ + UChar t; + if (a > b) { t = a; a = b; b = t; }; + if (b > c) { + b = c; + if (a > b) b = a; + } + return b; +} + +#define mmin(a,b) ((a) < (b)) ? (a) : (b) + +#define mpush(lz,hz,dz) { stackLo[sp] = lz; \ + stackHi[sp] = hz; \ + stackD [sp] = dz; \ + sp++; } + +#define mpop(lz,hz,dz) { sp--; \ + lz = stackLo[sp]; \ + hz = stackHi[sp]; \ + dz = stackD [sp]; } + + +#define mnextsize(az) (nextHi[az]-nextLo[az]) + +#define mnextswap(az,bz) \ + { Int32 tz; \ + tz = nextLo[az]; nextLo[az] = nextLo[bz]; nextLo[bz] = tz; \ + tz = nextHi[az]; nextHi[az] = nextHi[bz]; nextHi[bz] = tz; \ + tz = nextD [az]; nextD [az] = nextD [bz]; nextD [bz] = tz; } + + +#define MAIN_QSORT_SMALL_THRESH 20 +#define MAIN_QSORT_DEPTH_THRESH (BZ_N_RADIX + BZ_N_QSORT) +#define MAIN_QSORT_STACK_SIZE 100 + +static +void mainQSort3 ( UInt32* ptr, + UChar* block, + UInt16* quadrant, + Int32 nblock, + Int32 loSt, + Int32 hiSt, + Int32 dSt, + Int32* budget ) +{ + Int32 unLo, unHi, ltLo, gtHi, n, m, med; + Int32 sp, lo, hi, d; + + Int32 stackLo[MAIN_QSORT_STACK_SIZE]; + Int32 stackHi[MAIN_QSORT_STACK_SIZE]; + Int32 stackD [MAIN_QSORT_STACK_SIZE]; + + Int32 nextLo[3]; + Int32 nextHi[3]; + Int32 nextD [3]; + + sp = 0; + mpush ( loSt, hiSt, dSt ); + + while (sp > 0) { + + AssertH ( sp < MAIN_QSORT_STACK_SIZE, 1001 ); + + mpop ( lo, hi, d ); + if (hi - lo < MAIN_QSORT_SMALL_THRESH || + d > MAIN_QSORT_DEPTH_THRESH) { + mainSimpleSort ( ptr, block, quadrant, nblock, lo, hi, d, budget ); + if (*budget < 0) return; + continue; + } + + med = (Int32) + mmed3 ( block[ptr[ lo ]+d], + block[ptr[ hi ]+d], + block[ptr[ (lo+hi)>>1 ]+d] ); + + unLo = ltLo = lo; + unHi = gtHi = hi; + + while (True) { + while (True) { + if (unLo > unHi) break; + n = ((Int32)block[ptr[unLo]+d]) - med; + if (n == 0) { + mswap(ptr[unLo], ptr[ltLo]); + ltLo++; unLo++; continue; + }; + if (n > 0) break; + unLo++; + } + while (True) { + if (unLo > unHi) break; + n = ((Int32)block[ptr[unHi]+d]) - med; + if (n == 0) { + mswap(ptr[unHi], ptr[gtHi]); + gtHi--; unHi--; continue; + }; + if (n < 0) break; + unHi--; + } + if (unLo > unHi) break; + mswap(ptr[unLo], ptr[unHi]); unLo++; unHi--; + } + + AssertD ( unHi == unLo-1, "mainQSort3(2)" ); + + if (gtHi < ltLo) { + mpush(lo, hi, d+1 ); + continue; + } + + n = mmin(ltLo-lo, unLo-ltLo); mvswap(lo, unLo-n, n); + m = mmin(hi-gtHi, gtHi-unHi); mvswap(unLo, hi-m+1, m); + + n = lo + unLo - ltLo - 1; + m = hi - (gtHi - unHi) + 1; + + nextLo[0] = lo; nextHi[0] = n; nextD[0] = d; + nextLo[1] = m; nextHi[1] = hi; nextD[1] = d; + nextLo[2] = n+1; nextHi[2] = m-1; nextD[2] = d+1; + + if (mnextsize(0) < mnextsize(1)) mnextswap(0,1); + if (mnextsize(1) < mnextsize(2)) mnextswap(1,2); + if (mnextsize(0) < mnextsize(1)) mnextswap(0,1); + + AssertD (mnextsize(0) >= mnextsize(1), "mainQSort3(8)" ); + AssertD (mnextsize(1) >= mnextsize(2), "mainQSort3(9)" ); + + mpush (nextLo[0], nextHi[0], nextD[0]); + mpush (nextLo[1], nextHi[1], nextD[1]); + mpush (nextLo[2], nextHi[2], nextD[2]); + } +} + +#undef mswap +#undef mvswap +#undef mpush +#undef mpop +#undef mmin +#undef mnextsize +#undef mnextswap +#undef MAIN_QSORT_SMALL_THRESH +#undef MAIN_QSORT_DEPTH_THRESH +#undef MAIN_QSORT_STACK_SIZE + + +/*---------------------------------------------*/ +/* Pre: + nblock > N_OVERSHOOT + block32 exists for [0 .. nblock-1 +N_OVERSHOOT] + ((UChar*)block32) [0 .. nblock-1] holds block + ptr exists for [0 .. nblock-1] + + Post: + ((UChar*)block32) [0 .. nblock-1] holds block + All other areas of block32 destroyed + ftab [0 .. 65536 ] destroyed + ptr [0 .. nblock-1] holds sorted order + if (*budget < 0), sorting was abandoned +*/ + +#define BIGFREQ(b) (ftab[((b)+1) << 8] - ftab[(b) << 8]) +#define SETMASK (1 << 21) +#define CLEARMASK (~(SETMASK)) + +static +void mainSort ( UInt32* ptr, + UChar* block, + UInt16* quadrant, + UInt32* ftab, + Int32 nblock, + Int32 verb, + Int32* budget ) +{ + Int32 i, j, k, ss, sb; + Int32 runningOrder[256]; + Bool bigDone[256]; + Int32 copyStart[256]; + Int32 copyEnd [256]; + UChar c1; + Int32 numQSorted; + UInt16 s; + if (verb >= 4) VPrintf0 ( " main sort initialise ...\n" ); + + /*-- set up the 2-byte frequency table --*/ + for (i = 65536; i >= 0; i--) ftab[i] = 0; + + j = block[0] << 8; + i = nblock-1; + for (; i >= 3; i -= 4) { + quadrant[i] = 0; + j = (j >> 8) | ( ((UInt16)block[i]) << 8); + ftab[j]++; + quadrant[i-1] = 0; + j = (j >> 8) | ( ((UInt16)block[i-1]) << 8); + ftab[j]++; + quadrant[i-2] = 0; + j = (j >> 8) | ( ((UInt16)block[i-2]) << 8); + ftab[j]++; + quadrant[i-3] = 0; + j = (j >> 8) | ( ((UInt16)block[i-3]) << 8); + ftab[j]++; + } + for (; i >= 0; i--) { + quadrant[i] = 0; + j = (j >> 8) | ( ((UInt16)block[i]) << 8); + ftab[j]++; + } + + /*-- (emphasises close relationship of block & quadrant) --*/ + for (i = 0; i < BZ_N_OVERSHOOT; i++) { + block [nblock+i] = block[i]; + quadrant[nblock+i] = 0; + } + + if (verb >= 4) VPrintf0 ( " bucket sorting ...\n" ); + + /*-- Complete the initial radix sort --*/ + for (i = 1; i <= 65536; i++) ftab[i] += ftab[i-1]; + + s = block[0] << 8; + i = nblock-1; + for (; i >= 3; i -= 4) { + s = (s >> 8) | (block[i] << 8); + j = ftab[s] -1; + ftab[s] = j; + ptr[j] = i; + s = (s >> 8) | (block[i-1] << 8); + j = ftab[s] -1; + ftab[s] = j; + ptr[j] = i-1; + s = (s >> 8) | (block[i-2] << 8); + j = ftab[s] -1; + ftab[s] = j; + ptr[j] = i-2; + s = (s >> 8) | (block[i-3] << 8); + j = ftab[s] -1; + ftab[s] = j; + ptr[j] = i-3; + } + for (; i >= 0; i--) { + s = (s >> 8) | (block[i] << 8); + j = ftab[s] -1; + ftab[s] = j; + ptr[j] = i; + } + + /*-- + Now ftab contains the first loc of every small bucket. + Calculate the running order, from smallest to largest + big bucket. + --*/ + for (i = 0; i <= 255; i++) { + bigDone [i] = False; + runningOrder[i] = i; + } + + { + Int32 vv; + Int32 h = 1; + do h = 3 * h + 1; while (h <= 256); + do { + h = h / 3; + for (i = h; i <= 255; i++) { + vv = runningOrder[i]; + j = i; + while ( BIGFREQ(runningOrder[j-h]) > BIGFREQ(vv) ) { + runningOrder[j] = runningOrder[j-h]; + j = j - h; + if (j <= (h - 1)) goto zero; + } + zero: + runningOrder[j] = vv; + } + } while (h != 1); + } + + /*-- + The main sorting loop. + --*/ + + numQSorted = 0; + + for (i = 0; i <= 255; i++) { + + /*-- + Process big buckets, starting with the least full. + Basically this is a 3-step process in which we call + mainQSort3 to sort the small buckets [ss, j], but + also make a big effort to avoid the calls if we can. + --*/ + ss = runningOrder[i]; + + /*-- + Step 1: + Complete the big bucket [ss] by quicksorting + any unsorted small buckets [ss, j], for j != ss. + Hopefully previous pointer-scanning phases have already + completed many of the small buckets [ss, j], so + we don't have to sort them at all. + --*/ + for (j = 0; j <= 255; j++) { + if (j != ss) { + sb = (ss << 8) + j; + if ( ! (ftab[sb] & SETMASK) ) { + Int32 lo = ftab[sb] & CLEARMASK; + Int32 hi = (ftab[sb+1] & CLEARMASK) - 1; + if (hi > lo) { + if (verb >= 4) + VPrintf4 ( " qsort [0x%x, 0x%x] " + "done %d this %d\n", + ss, j, numQSorted, hi - lo + 1 ); + mainQSort3 ( + ptr, block, quadrant, nblock, + lo, hi, BZ_N_RADIX, budget + ); + numQSorted += (hi - lo + 1); + if (*budget < 0) return; + } + } + ftab[sb] |= SETMASK; + } + } + + AssertH ( !bigDone[ss], 1006 ); + + /*-- + Step 2: + Now scan this big bucket [ss] so as to synthesise the + sorted order for small buckets [t, ss] for all t, + including, magically, the bucket [ss,ss] too. + This will avoid doing Real Work in subsequent Step 1's. + --*/ + { + for (j = 0; j <= 255; j++) { + copyStart[j] = ftab[(j << 8) + ss] & CLEARMASK; + copyEnd [j] = (ftab[(j << 8) + ss + 1] & CLEARMASK) - 1; + } + for (j = ftab[ss << 8] & CLEARMASK; j < copyStart[ss]; j++) { + k = ptr[j]-1; if (k < 0) k += nblock; + c1 = block[k]; + if (!bigDone[c1]) + ptr[ copyStart[c1]++ ] = k; + } + for (j = (ftab[(ss+1) << 8] & CLEARMASK) - 1; j > copyEnd[ss]; j--) { + k = ptr[j]-1; if (k < 0) k += nblock; + c1 = block[k]; + if (!bigDone[c1]) + ptr[ copyEnd[c1]-- ] = k; + } + } + + AssertH ( (copyStart[ss]-1 == copyEnd[ss]) + || + /* Extremely rare case missing in bzip2-1.0.0 and 1.0.1. + Necessity for this case is demonstrated by compressing + a sequence of approximately 48.5 million of character + 251; 1.0.0/1.0.1 will then die here. */ + (copyStart[ss] == 0 && copyEnd[ss] == nblock-1), + 1007 ) + + for (j = 0; j <= 255; j++) ftab[(j << 8) + ss] |= SETMASK; + + /*-- + Step 3: + The [ss] big bucket is now done. Record this fact, + and update the quadrant descriptors. Remember to + update quadrants in the overshoot area too, if + necessary. The "if (i < 255)" test merely skips + this updating for the last bucket processed, since + updating for the last bucket is pointless. + + The quadrant array provides a way to incrementally + cache sort orderings, as they appear, so as to + make subsequent comparisons in fullGtU() complete + faster. For repetitive blocks this makes a big + difference (but not big enough to be able to avoid + the fallback sorting mechanism, exponential radix sort). + + The precise meaning is: at all times: + + for 0 <= i < nblock and 0 <= j <= nblock + + if block[i] != block[j], + + then the relative values of quadrant[i] and + quadrant[j] are meaningless. + + else { + if quadrant[i] < quadrant[j] + then the string starting at i lexicographically + precedes the string starting at j + + else if quadrant[i] > quadrant[j] + then the string starting at j lexicographically + precedes the string starting at i + + else + the relative ordering of the strings starting + at i and j has not yet been determined. + } + --*/ + bigDone[ss] = True; + + if (i < 255) { + Int32 bbStart = ftab[ss << 8] & CLEARMASK; + Int32 bbSize = (ftab[(ss+1) << 8] & CLEARMASK) - bbStart; + Int32 shifts = 0; + + while ((bbSize >> shifts) > 65534) shifts++; + + for (j = bbSize-1; j >= 0; j--) { + Int32 a2update = ptr[bbStart + j]; + UInt16 qVal = (UInt16)(j >> shifts); + quadrant[a2update] = qVal; + if (a2update < BZ_N_OVERSHOOT) + quadrant[a2update + nblock] = qVal; + } + AssertH ( ((bbSize-1) >> shifts) <= 65535, 1002 ); + } + + } + + if (verb >= 4) + VPrintf3 ( " %d pointers, %d sorted, %d scanned\n", + nblock, numQSorted, nblock - numQSorted ); +} + +#undef BIGFREQ +#undef SETMASK +#undef CLEARMASK + + +/*---------------------------------------------*/ +/* Pre: + nblock > 0 + arr2 exists for [0 .. nblock-1 +N_OVERSHOOT] + ((UChar*)arr2) [0 .. nblock-1] holds block + arr1 exists for [0 .. nblock-1] + + Post: + ((UChar*)arr2) [0 .. nblock-1] holds block + All other areas of block destroyed + ftab [ 0 .. 65536 ] destroyed + arr1 [0 .. nblock-1] holds sorted order +*/ +void BZ2_blockSort ( EState* s ) +{ + UInt32* ptr = s->ptr; + UChar* block = s->block; + UInt32* ftab = s->ftab; + Int32 nblock = s->nblock; + Int32 verb = s->verbosity; + Int32 wfact = s->workFactor; + UInt16* quadrant; + Int32 budget; + Int32 budgetInit; + Int32 i; + + if (nblock < /* 10000 */1000 ) { + fallbackSort ( s->arr1, s->arr2, ftab, nblock, verb ); + } else { + /* Calculate the location for quadrant, remembering to get + the alignment right. Assumes that &(block[0]) is at least + 2-byte aligned -- this should be ok since block is really + the first section of arr2. + */ + i = nblock+BZ_N_OVERSHOOT; + if (i & 1) i++; + quadrant = (UInt16*)(&(block[i])); + + /* (wfact-1) / 3 puts the default-factor-30 + transition point at very roughly the same place as + with v0.1 and v0.9.0. + Not that it particularly matters any more, since the + resulting compressed stream is now the same regardless + of whether or not we use the main sort or fallback sort. + */ + if (wfact < 1 ) wfact = 1; + if (wfact > 100) wfact = 100; + budgetInit = nblock * ((wfact-1) / 3); + budget = budgetInit; + + mainSort ( ptr, block, quadrant, ftab, nblock, verb, &budget ); + if (0 && verb >= 3) + VPrintf3 ( " %d work, %d block, ratio %5.2f\n", + budgetInit - budget, + nblock, + (float)(budgetInit - budget) / + (float)(nblock==0 ? 1 : nblock) ); + if (budget < 0) { + if (verb >= 2) + VPrintf0 ( " too repetitive; using fallback" + " sorting algorithm\n" ); + fallbackSort ( s->arr1, s->arr2, ftab, nblock, verb ); + } + } + + s->origPtr = -1; + for (i = 0; i < s->nblock; i++) + if (ptr[i] == 0) + { s->origPtr = i; break; }; + + AssertH( s->origPtr != -1, 1003 ); +} + + +/*-------------------------------------------------------------*/ +/*--- end blocksort.c ---*/ +/*-------------------------------------------------------------*/ + +/*-------------------------------------------------------------*/ +/*--- Huffman coding low-level stuff ---*/ +/*--- huffman.c ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + + + +/*---------------------------------------------------*/ +#define WEIGHTOF(zz0) ((zz0) & 0xffffff00) +#define DEPTHOF(zz1) ((zz1) & 0x000000ff) +#define MYMAX(zz2,zz3) ((zz2) > (zz3) ? (zz2) : (zz3)) + +#define ADDWEIGHTS(zw1,zw2) \ + (WEIGHTOF(zw1)+WEIGHTOF(zw2)) | \ + (1 + MYMAX(DEPTHOF(zw1),DEPTHOF(zw2))) + +#define UPHEAP(z) \ +{ \ + Int32 zz, tmp; \ + zz = z; tmp = heap[zz]; \ + while (weight[tmp] < weight[heap[zz >> 1]]) { \ + heap[zz] = heap[zz >> 1]; \ + zz >>= 1; \ + } \ + heap[zz] = tmp; \ +} + +#define DOWNHEAP(z) \ +{ \ + Int32 zz, yy, tmp; \ + zz = z; tmp = heap[zz]; \ + while (True) { \ + yy = zz << 1; \ + if (yy > nHeap) break; \ + if (yy < nHeap && \ + weight[heap[yy+1]] < weight[heap[yy]]) \ + yy++; \ + if (weight[tmp] < weight[heap[yy]]) break; \ + heap[zz] = heap[yy]; \ + zz = yy; \ + } \ + heap[zz] = tmp; \ +} + + +/*---------------------------------------------------*/ +void BZ2_hbMakeCodeLengths ( UChar *len, + Int32 *freq, + Int32 alphaSize, + Int32 maxLen ) +{ + /*-- + Nodes and heap entries run from 1. Entry 0 + for both the heap and nodes is a sentinel. + --*/ + Int32 nNodes, nHeap, n1, n2, i, j, k; + Bool tooLong; + + Int32 heap [ BZ_MAX_ALPHA_SIZE + 2 ]; + Int32 weight [ BZ_MAX_ALPHA_SIZE * 2 ]; + Int32 parent [ BZ_MAX_ALPHA_SIZE * 2 ]; + + for (i = 0; i < alphaSize; i++) + weight[i+1] = (freq[i] == 0 ? 1 : freq[i]) << 8; + + while (True) { + + nNodes = alphaSize; + nHeap = 0; + + heap[0] = 0; + weight[0] = 0; + parent[0] = -2; + + for (i = 1; i <= alphaSize; i++) { + parent[i] = -1; + nHeap++; + heap[nHeap] = i; + UPHEAP(nHeap); + } + + AssertH( nHeap < (BZ_MAX_ALPHA_SIZE+2), 2001 ); + + while (nHeap > 1) { + n1 = heap[1]; heap[1] = heap[nHeap]; nHeap--; DOWNHEAP(1); + n2 = heap[1]; heap[1] = heap[nHeap]; nHeap--; DOWNHEAP(1); + nNodes++; + parent[n1] = parent[n2] = nNodes; + weight[nNodes] = ADDWEIGHTS(weight[n1], weight[n2]); + parent[nNodes] = -1; + nHeap++; + heap[nHeap] = nNodes; + UPHEAP(nHeap); + } + + AssertH( nNodes < (BZ_MAX_ALPHA_SIZE * 2), 2002 ); + + tooLong = False; + for (i = 1; i <= alphaSize; i++) { + j = 0; + k = i; + while (parent[k] >= 0) { k = parent[k]; j++; } + len[i-1] = j; + if (j > maxLen) tooLong = True; + } + + if (! tooLong) break; + + /* 17 Oct 04: keep-going condition for the following loop used + to be 'i < alphaSize', which missed the last element, + theoretically leading to the possibility of the compressor + looping. However, this count-scaling step is only needed if + one of the generated Huffman code words is longer than + maxLen, which up to and including version 1.0.2 was 20 bits, + which is extremely unlikely. In version 1.0.3 maxLen was + changed to 17 bits, which has minimal effect on compression + ratio, but does mean this scaling step is used from time to + time, enough to verify that it works. + + This means that bzip2-1.0.3 and later will only produce + Huffman codes with a maximum length of 17 bits. However, in + order to preserve backwards compatibility with bitstreams + produced by versions pre-1.0.3, the decompressor must still + handle lengths of up to 20. */ + + for (i = 1; i <= alphaSize; i++) { + j = weight[i] >> 8; + j = 1 + (j / 2); + weight[i] = j << 8; + } + } +} + + +/*---------------------------------------------------*/ +void BZ2_hbAssignCodes ( Int32 *code, + UChar *length, + Int32 minLen, + Int32 maxLen, + Int32 alphaSize ) +{ + Int32 n, vec, i; + + vec = 0; + for (n = minLen; n <= maxLen; n++) { + for (i = 0; i < alphaSize; i++) + if (length[i] == n) { code[i] = vec; vec++; }; + vec <<= 1; + } +} + + +/*---------------------------------------------------*/ +void BZ2_hbCreateDecodeTables ( Int32 *limit, + Int32 *base, + Int32 *perm, + UChar *length, + Int32 minLen, + Int32 maxLen, + Int32 alphaSize ) +{ + Int32 pp, i, j, vec; + + pp = 0; + for (i = minLen; i <= maxLen; i++) + for (j = 0; j < alphaSize; j++) + if (length[j] == i) { perm[pp] = j; pp++; }; + + for (i = 0; i < BZ_MAX_CODE_LEN; i++) base[i] = 0; + for (i = 0; i < alphaSize; i++) base[length[i]+1]++; + + for (i = 1; i < BZ_MAX_CODE_LEN; i++) base[i] += base[i-1]; + + for (i = 0; i < BZ_MAX_CODE_LEN; i++) limit[i] = 0; + vec = 0; + + for (i = minLen; i <= maxLen; i++) { + vec += (base[i+1] - base[i]); + limit[i] = vec-1; + vec <<= 1; + } + for (i = minLen + 1; i <= maxLen; i++) + base[i] = ((limit[i-1] + 1) << 1) - base[i]; +} + + +/*-------------------------------------------------------------*/ +/*--- end huffman.c ---*/ +/*-------------------------------------------------------------*/ + +/*-------------------------------------------------------------*/ +/*--- Compression machinery (not incl block sorting) ---*/ +/*--- compress.c ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + +/*-- + CHANGES + ~~~~~~~ + 0.9.0 -- original version. + + 0.9.0a/b -- no changes in this file. + + 0.9.0c + * changed setting of nGroups in sendMTFValues() so as to + do a bit better on small files +--*/ + + + +/*---------------------------------------------------*/ +/*--- Bit stream I/O ---*/ +/*---------------------------------------------------*/ + +/*---------------------------------------------------*/ +void BZ2_bsInitWrite ( EState* s ) +{ + s->bsLive = 0; + s->bsBuff = 0; +} + + +/*---------------------------------------------------*/ +static +void bsFinishWrite ( EState* s ) +{ + while (s->bsLive > 0) { + s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24); + s->numZ++; + s->bsBuff <<= 8; + s->bsLive -= 8; + } +} + + +/*---------------------------------------------------*/ +#define bsNEEDW(nz) \ +{ \ + while (s->bsLive >= 8) { \ + s->zbits[s->numZ] \ + = (UChar)(s->bsBuff >> 24); \ + s->numZ++; \ + s->bsBuff <<= 8; \ + s->bsLive -= 8; \ + } \ +} + + +/*---------------------------------------------------*/ +static +__inline__ +void bsW ( EState* s, Int32 n, UInt32 v ) +{ + bsNEEDW ( n ); + s->bsBuff |= (v << (32 - s->bsLive - n)); + s->bsLive += n; +} + + +/*---------------------------------------------------*/ +static +void bsPutUInt32 ( EState* s, UInt32 u ) +{ + bsW ( s, 8, (u >> 24) & 0xffL ); + bsW ( s, 8, (u >> 16) & 0xffL ); + bsW ( s, 8, (u >> 8) & 0xffL ); + bsW ( s, 8, u & 0xffL ); +} + + +/*---------------------------------------------------*/ +static +void bsPutUChar ( EState* s, UChar c ) +{ + bsW( s, 8, (UInt32)c ); +} + + +/*---------------------------------------------------*/ +/*--- The back end proper ---*/ +/*---------------------------------------------------*/ + +/*---------------------------------------------------*/ +static +void makeMaps_e ( EState* s ) +{ + Int32 i; + s->nInUse = 0; + for (i = 0; i < 256; i++) + if (s->inUse[i]) { + s->unseqToSeq[i] = s->nInUse; + s->nInUse++; + } +} + + +/*---------------------------------------------------*/ +static +void generateMTFValues ( EState* s ) +{ + UChar yy[256]; + Int32 i, j; + Int32 zPend; + Int32 wr; + Int32 EOB; + + /* + After sorting (eg, here), + s->arr1 [ 0 .. s->nblock-1 ] holds sorted order, + and + ((UChar*)s->arr2) [ 0 .. s->nblock-1 ] + holds the original block data. + + The first thing to do is generate the MTF values, + and put them in + ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ]. + Because there are strictly fewer or equal MTF values + than block values, ptr values in this area are overwritten + with MTF values only when they are no longer needed. + + The final compressed bitstream is generated into the + area starting at + (UChar*) (&((UChar*)s->arr2)[s->nblock]) + + These storage aliases are set up in bzCompressInit(), + except for the last one, which is arranged in + compressBlock(). + */ + UInt32* ptr = s->ptr; + UChar* block = s->block; + UInt16* mtfv = s->mtfv; + + makeMaps_e ( s ); + EOB = s->nInUse+1; + + for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0; + + wr = 0; + zPend = 0; + for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i; + + for (i = 0; i < s->nblock; i++) { + UChar ll_i; + AssertD ( wr <= i, "generateMTFValues(1)" ); + j = ptr[i]-1; if (j < 0) j += s->nblock; + ll_i = s->unseqToSeq[block[j]]; + AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" ); + + if (yy[0] == ll_i) { + zPend++; + } else { + + if (zPend > 0) { + zPend--; + while (True) { + if (zPend & 1) { + mtfv[wr] = BZ_RUNB; wr++; + s->mtfFreq[BZ_RUNB]++; + } else { + mtfv[wr] = BZ_RUNA; wr++; + s->mtfFreq[BZ_RUNA]++; + } + if (zPend < 2) break; + zPend = (zPend - 2) / 2; + }; + zPend = 0; + } + { + register UChar rtmp; + register UChar* ryy_j; + register UChar rll_i; + rtmp = yy[1]; + yy[1] = yy[0]; + ryy_j = &(yy[1]); + rll_i = ll_i; + while ( rll_i != rtmp ) { + register UChar rtmp2; + ryy_j++; + rtmp2 = rtmp; + rtmp = *ryy_j; + *ryy_j = rtmp2; + }; + yy[0] = rtmp; + j = ryy_j - &(yy[0]); + mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++; + } + + } + } + + if (zPend > 0) { + zPend--; + while (True) { + if (zPend & 1) { + mtfv[wr] = BZ_RUNB; wr++; + s->mtfFreq[BZ_RUNB]++; + } else { + mtfv[wr] = BZ_RUNA; wr++; + s->mtfFreq[BZ_RUNA]++; + } + if (zPend < 2) break; + zPend = (zPend - 2) / 2; + }; + zPend = 0; + } + + mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++; + + s->nMTF = wr; +} + + +/*---------------------------------------------------*/ +#define BZ_LESSER_ICOST 0 +#define BZ_GREATER_ICOST 15 + +static +void sendMTFValues ( EState* s ) +{ + Int32 v, t, i, j, gs, ge, totc, bt, bc, iter; + Int32 nSelectors, alphaSize, minLen, maxLen, selCtr; + Int32 nGroups, nBytes; + + /*-- + UChar len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + is a global since the decoder also needs it. + + Int32 code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + Int32 rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE]; + are also globals only used in this proc. + Made global to keep stack frame size small. + --*/ + + + UInt16 cost[BZ_N_GROUPS]; + Int32 fave[BZ_N_GROUPS]; + + UInt16* mtfv = s->mtfv; + + if (s->verbosity >= 3) + VPrintf3( " %d in block, %d after MTF & 1-2 coding, " + "%d+2 syms in use\n", + s->nblock, s->nMTF, s->nInUse ); + + alphaSize = s->nInUse+2; + for (t = 0; t < BZ_N_GROUPS; t++) + for (v = 0; v < alphaSize; v++) + s->len[t][v] = BZ_GREATER_ICOST; + + /*--- Decide how many coding tables to use ---*/ + AssertH ( s->nMTF > 0, 3001 ); + if (s->nMTF < 200) nGroups = 2; else + if (s->nMTF < 600) nGroups = 3; else + if (s->nMTF < 1200) nGroups = 4; else + if (s->nMTF < 2400) nGroups = 5; else + nGroups = 6; + + /*--- Generate an initial set of coding tables ---*/ + { + Int32 nPart, remF, tFreq, aFreq; + + nPart = nGroups; + remF = s->nMTF; + gs = 0; + while (nPart > 0) { + tFreq = remF / nPart; + ge = gs-1; + aFreq = 0; + while (aFreq < tFreq && ge < alphaSize-1) { + ge++; + aFreq += s->mtfFreq[ge]; + } + + if (ge > gs + && nPart != nGroups && nPart != 1 + && ((nGroups-nPart) % 2 == 1)) { + aFreq -= s->mtfFreq[ge]; + ge--; + } + + if (0 && s->verbosity >= 3) + VPrintf5( " initial group %d, [%d .. %d], " + "has %d syms (%4.1f%%)\n", + nPart, gs, ge, aFreq, + (100.0 * (float)aFreq) / (float)(s->nMTF) ); + + for (v = 0; v < alphaSize; v++) + if (v >= gs && v <= ge) + s->len[nPart-1][v] = BZ_LESSER_ICOST; else + s->len[nPart-1][v] = BZ_GREATER_ICOST; + + nPart--; + gs = ge+1; + remF -= aFreq; + } + } + + /*--- + Iterate up to BZ_N_ITERS times to improve the tables. + ---*/ + for (iter = 0; iter < BZ_N_ITERS; iter++) { + + for (t = 0; t < nGroups; t++) fave[t] = 0; + + for (t = 0; t < nGroups; t++) + for (v = 0; v < alphaSize; v++) + s->rfreq[t][v] = 0; + + /*--- + Set up an auxiliary length table which is used to fast-track + the common case (nGroups == 6). + ---*/ + if (nGroups == 6) { + for (v = 0; v < alphaSize; v++) { + s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v]; + s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v]; + s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v]; + } + } + + nSelectors = 0; + totc = 0; + gs = 0; + while (True) { + + /*--- Set group start & end marks. --*/ + if (gs >= s->nMTF) break; + ge = gs + BZ_G_SIZE - 1; + if (ge >= s->nMTF) ge = s->nMTF-1; + + /*-- + Calculate the cost of this group as coded + by each of the coding tables. + --*/ + for (t = 0; t < nGroups; t++) cost[t] = 0; + + if (nGroups == 6 && 50 == ge-gs+1) { + /*--- fast track the common case ---*/ + register UInt32 cost01, cost23, cost45; + register UInt16 icv; + cost01 = cost23 = cost45 = 0; + +# define BZ_ITER(nn) \ + icv = mtfv[gs+(nn)]; \ + cost01 += s->len_pack[icv][0]; \ + cost23 += s->len_pack[icv][1]; \ + cost45 += s->len_pack[icv][2]; \ + + BZ_ITER(0); BZ_ITER(1); BZ_ITER(2); BZ_ITER(3); BZ_ITER(4); + BZ_ITER(5); BZ_ITER(6); BZ_ITER(7); BZ_ITER(8); BZ_ITER(9); + BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14); + BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19); + BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24); + BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29); + BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34); + BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39); + BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44); + BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49); + +# undef BZ_ITER + + cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16; + cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16; + cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16; + + } else { + /*--- slow version which correctly handles all situations ---*/ + for (i = gs; i <= ge; i++) { + UInt16 icv = mtfv[i]; + for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv]; + } + } + + /*-- + Find the coding table which is best for this group, + and record its identity in the selector table. + --*/ + bc = 999999999; bt = -1; + for (t = 0; t < nGroups; t++) + if (cost[t] < bc) { bc = cost[t]; bt = t; }; + totc += bc; + fave[bt]++; + s->selector[nSelectors] = bt; + nSelectors++; + + /*-- + Increment the symbol frequencies for the selected table. + --*/ + if (nGroups == 6 && 50 == ge-gs+1) { + /*--- fast track the common case ---*/ + +# define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++ + + BZ_ITUR(0); BZ_ITUR(1); BZ_ITUR(2); BZ_ITUR(3); BZ_ITUR(4); + BZ_ITUR(5); BZ_ITUR(6); BZ_ITUR(7); BZ_ITUR(8); BZ_ITUR(9); + BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14); + BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19); + BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24); + BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29); + BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34); + BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39); + BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44); + BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49); + +# undef BZ_ITUR + + } else { + /*--- slow version which correctly handles all situations ---*/ + for (i = gs; i <= ge; i++) + s->rfreq[bt][ mtfv[i] ]++; + } + + gs = ge+1; + } + if (s->verbosity >= 3) { + VPrintf2 ( " pass %d: size is %d, grp uses are ", + iter+1, totc/8 ); + for (t = 0; t < nGroups; t++) + VPrintf1 ( "%d ", fave[t] ); + VPrintf0 ( "\n" ); + } + + /*-- + Recompute the tables based on the accumulated frequencies. + --*/ + /* maxLen was changed from 20 to 17 in bzip2-1.0.3. See + comment in huffman.c for details. */ + for (t = 0; t < nGroups; t++) + BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]), + alphaSize, 17 /*20*/ ); + } + + + AssertH( nGroups < 8, 3002 ); + AssertH( nSelectors < 32768 && + nSelectors <= (2 + (900000 / BZ_G_SIZE)), + 3003 ); + + + /*--- Compute MTF values for the selectors. ---*/ + { + UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp; + for (i = 0; i < nGroups; i++) pos[i] = i; + for (i = 0; i < nSelectors; i++) { + ll_i = s->selector[i]; + j = 0; + tmp = pos[j]; + while ( ll_i != tmp ) { + j++; + tmp2 = tmp; + tmp = pos[j]; + pos[j] = tmp2; + }; + pos[0] = tmp; + s->selectorMtf[i] = j; + } + }; + + /*--- Assign actual codes for the tables. --*/ + for (t = 0; t < nGroups; t++) { + minLen = 32; + maxLen = 0; + for (i = 0; i < alphaSize; i++) { + if (s->len[t][i] > maxLen) maxLen = s->len[t][i]; + if (s->len[t][i] < minLen) minLen = s->len[t][i]; + } + AssertH ( !(maxLen > 17 /*20*/ ), 3004 ); + AssertH ( !(minLen < 1), 3005 ); + BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]), + minLen, maxLen, alphaSize ); + } + + /*--- Transmit the mapping table. ---*/ + { + Bool inUse16[16]; + for (i = 0; i < 16; i++) { + inUse16[i] = False; + for (j = 0; j < 16; j++) + if (s->inUse[i * 16 + j]) inUse16[i] = True; + } + + nBytes = s->numZ; + for (i = 0; i < 16; i++) + if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0); + + for (i = 0; i < 16; i++) + if (inUse16[i]) + for (j = 0; j < 16; j++) { + if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0); + } + + if (s->verbosity >= 3) + VPrintf1( " bytes: mapping %d, ", s->numZ-nBytes ); + } + + /*--- Now the selectors. ---*/ + nBytes = s->numZ; + bsW ( s, 3, nGroups ); + bsW ( s, 15, nSelectors ); + for (i = 0; i < nSelectors; i++) { + for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1); + bsW(s,1,0); + } + if (s->verbosity >= 3) + VPrintf1( "selectors %d, ", s->numZ-nBytes ); + + /*--- Now the coding tables. ---*/ + nBytes = s->numZ; + + for (t = 0; t < nGroups; t++) { + Int32 curr = s->len[t][0]; + bsW ( s, 5, curr ); + for (i = 0; i < alphaSize; i++) { + while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ }; + while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ }; + bsW ( s, 1, 0 ); + } + } + + if (s->verbosity >= 3) + VPrintf1 ( "code lengths %d, ", s->numZ-nBytes ); + + /*--- And finally, the block data proper ---*/ + nBytes = s->numZ; + selCtr = 0; + gs = 0; + while (True) { + if (gs >= s->nMTF) break; + ge = gs + BZ_G_SIZE - 1; + if (ge >= s->nMTF) ge = s->nMTF-1; + AssertH ( s->selector[selCtr] < nGroups, 3006 ); + + if (nGroups == 6 && 50 == ge-gs+1) { + /*--- fast track the common case ---*/ + UInt16 mtfv_i; + UChar* s_len_sel_selCtr + = &(s->len[s->selector[selCtr]][0]); + Int32* s_code_sel_selCtr + = &(s->code[s->selector[selCtr]][0]); + +# define BZ_ITAH(nn) \ + mtfv_i = mtfv[gs+(nn)]; \ + bsW ( s, \ + s_len_sel_selCtr[mtfv_i], \ + s_code_sel_selCtr[mtfv_i] ) + + BZ_ITAH(0); BZ_ITAH(1); BZ_ITAH(2); BZ_ITAH(3); BZ_ITAH(4); + BZ_ITAH(5); BZ_ITAH(6); BZ_ITAH(7); BZ_ITAH(8); BZ_ITAH(9); + BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14); + BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19); + BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24); + BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29); + BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34); + BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39); + BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44); + BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49); + +# undef BZ_ITAH + + } else { + /*--- slow version which correctly handles all situations ---*/ + for (i = gs; i <= ge; i++) { + bsW ( s, + s->len [s->selector[selCtr]] [mtfv[i]], + s->code [s->selector[selCtr]] [mtfv[i]] ); + } + } + + + gs = ge+1; + selCtr++; + } + AssertH( selCtr == nSelectors, 3007 ); + + if (s->verbosity >= 3) + VPrintf1( "codes %d\n", s->numZ-nBytes ); +} + + +/*---------------------------------------------------*/ +void BZ2_compressBlock ( EState* s, Bool is_last_block ) +{ + if (s->nblock > 0) { + + BZ_FINALISE_CRC ( s->blockCRC ); + s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31); + s->combinedCRC ^= s->blockCRC; + if (s->blockNo > 1) s->numZ = 0; + + if (s->verbosity >= 2) + VPrintf4( " block %d: crc = 0x%08x, " + "combined CRC = 0x%08x, size = %d\n", + s->blockNo, s->blockCRC, s->combinedCRC, s->nblock ); + + BZ2_blockSort ( s ); + } + + s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]); + + /*-- If this is the first block, create the stream header. --*/ + if (s->blockNo == 1) { + BZ2_bsInitWrite ( s ); + bsPutUChar ( s, BZ_HDR_B ); + bsPutUChar ( s, BZ_HDR_Z ); + bsPutUChar ( s, BZ_HDR_h ); + bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) ); + } + + if (s->nblock > 0) { + + bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 ); + bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 ); + bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 ); + + /*-- Now the block's CRC, so it is in a known place. --*/ + bsPutUInt32 ( s, s->blockCRC ); + + /*-- + Now a single bit indicating (non-)randomisation. + As of version 0.9.5, we use a better sorting algorithm + which makes randomisation unnecessary. So always set + the randomised bit to 'no'. Of course, the decoder + still needs to be able to handle randomised blocks + so as to maintain backwards compatibility with + older versions of bzip2. + --*/ + bsW(s,1,0); + + bsW ( s, 24, s->origPtr ); + generateMTFValues ( s ); + sendMTFValues ( s ); + } + + + /*-- If this is the last block, add the stream trailer. --*/ + if (is_last_block) { + + bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 ); + bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 ); + bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 ); + bsPutUInt32 ( s, s->combinedCRC ); + if (s->verbosity >= 2) + VPrintf1( " final combined CRC = 0x%08x\n ", s->combinedCRC ); + bsFinishWrite ( s ); + } +} + + +/*-------------------------------------------------------------*/ +/*--- end compress.c ---*/ +/*-------------------------------------------------------------*/ + + +/*-------------------------------------------------------------*/ +/*--- Table for randomising repetitive blocks ---*/ +/*--- randtable.c ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + + + + +/*---------------------------------------------*/ +Int32 BZ2_rNums[512] = { + 619, 720, 127, 481, 931, 816, 813, 233, 566, 247, + 985, 724, 205, 454, 863, 491, 741, 242, 949, 214, + 733, 859, 335, 708, 621, 574, 73, 654, 730, 472, + 419, 436, 278, 496, 867, 210, 399, 680, 480, 51, + 878, 465, 811, 169, 869, 675, 611, 697, 867, 561, + 862, 687, 507, 283, 482, 129, 807, 591, 733, 623, + 150, 238, 59, 379, 684, 877, 625, 169, 643, 105, + 170, 607, 520, 932, 727, 476, 693, 425, 174, 647, + 73, 122, 335, 530, 442, 853, 695, 249, 445, 515, + 909, 545, 703, 919, 874, 474, 882, 500, 594, 612, + 641, 801, 220, 162, 819, 984, 589, 513, 495, 799, + 161, 604, 958, 533, 221, 400, 386, 867, 600, 782, + 382, 596, 414, 171, 516, 375, 682, 485, 911, 276, + 98, 553, 163, 354, 666, 933, 424, 341, 533, 870, + 227, 730, 475, 186, 263, 647, 537, 686, 600, 224, + 469, 68, 770, 919, 190, 373, 294, 822, 808, 206, + 184, 943, 795, 384, 383, 461, 404, 758, 839, 887, + 715, 67, 618, 276, 204, 918, 873, 777, 604, 560, + 951, 160, 578, 722, 79, 804, 96, 409, 713, 940, + 652, 934, 970, 447, 318, 353, 859, 672, 112, 785, + 645, 863, 803, 350, 139, 93, 354, 99, 820, 908, + 609, 772, 154, 274, 580, 184, 79, 626, 630, 742, + 653, 282, 762, 623, 680, 81, 927, 626, 789, 125, + 411, 521, 938, 300, 821, 78, 343, 175, 128, 250, + 170, 774, 972, 275, 999, 639, 495, 78, 352, 126, + 857, 956, 358, 619, 580, 124, 737, 594, 701, 612, + 669, 112, 134, 694, 363, 992, 809, 743, 168, 974, + 944, 375, 748, 52, 600, 747, 642, 182, 862, 81, + 344, 805, 988, 739, 511, 655, 814, 334, 249, 515, + 897, 955, 664, 981, 649, 113, 974, 459, 893, 228, + 433, 837, 553, 268, 926, 240, 102, 654, 459, 51, + 686, 754, 806, 760, 493, 403, 415, 394, 687, 700, + 946, 670, 656, 610, 738, 392, 760, 799, 887, 653, + 978, 321, 576, 617, 626, 502, 894, 679, 243, 440, + 680, 879, 194, 572, 640, 724, 926, 56, 204, 700, + 707, 151, 457, 449, 797, 195, 791, 558, 945, 679, + 297, 59, 87, 824, 713, 663, 412, 693, 342, 606, + 134, 108, 571, 364, 631, 212, 174, 643, 304, 329, + 343, 97, 430, 751, 497, 314, 983, 374, 822, 928, + 140, 206, 73, 263, 980, 736, 876, 478, 430, 305, + 170, 514, 364, 692, 829, 82, 855, 953, 676, 246, + 369, 970, 294, 750, 807, 827, 150, 790, 288, 923, + 804, 378, 215, 828, 592, 281, 565, 555, 710, 82, + 896, 831, 547, 261, 524, 462, 293, 465, 502, 56, + 661, 821, 976, 991, 658, 869, 905, 758, 745, 193, + 768, 550, 608, 933, 378, 286, 215, 979, 792, 961, + 61, 688, 793, 644, 986, 403, 106, 366, 905, 644, + 372, 567, 466, 434, 645, 210, 389, 550, 919, 135, + 780, 773, 635, 389, 707, 100, 626, 958, 165, 504, + 920, 176, 193, 713, 857, 265, 203, 50, 668, 108, + 645, 990, 626, 197, 510, 357, 358, 850, 858, 364, + 936, 638 +}; + + +/*-------------------------------------------------------------*/ +/*--- end randtable.c ---*/ +/*-------------------------------------------------------------*/ + +/*-------------------------------------------------------------*/ +/*--- Table for doing CRCs ---*/ +/*--- crctable.c ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + + + + + +/*-- + I think this is an implementation of the AUTODIN-II, + Ethernet & FDDI 32-bit CRC standard. Vaguely derived + from code by Rob Warnock, in Section 51 of the + comp.compression FAQ. +--*/ + +UInt32 BZ2_crc32Table[256] = { + + /*-- Ugly, innit? --*/ + + 0x00000000L, 0x04c11db7L, 0x09823b6eL, 0x0d4326d9L, + 0x130476dcL, 0x17c56b6bL, 0x1a864db2L, 0x1e475005L, + 0x2608edb8L, 0x22c9f00fL, 0x2f8ad6d6L, 0x2b4bcb61L, + 0x350c9b64L, 0x31cd86d3L, 0x3c8ea00aL, 0x384fbdbdL, + 0x4c11db70L, 0x48d0c6c7L, 0x4593e01eL, 0x4152fda9L, + 0x5f15adacL, 0x5bd4b01bL, 0x569796c2L, 0x52568b75L, + 0x6a1936c8L, 0x6ed82b7fL, 0x639b0da6L, 0x675a1011L, + 0x791d4014L, 0x7ddc5da3L, 0x709f7b7aL, 0x745e66cdL, + 0x9823b6e0L, 0x9ce2ab57L, 0x91a18d8eL, 0x95609039L, + 0x8b27c03cL, 0x8fe6dd8bL, 0x82a5fb52L, 0x8664e6e5L, + 0xbe2b5b58L, 0xbaea46efL, 0xb7a96036L, 0xb3687d81L, + 0xad2f2d84L, 0xa9ee3033L, 0xa4ad16eaL, 0xa06c0b5dL, + 0xd4326d90L, 0xd0f37027L, 0xddb056feL, 0xd9714b49L, + 0xc7361b4cL, 0xc3f706fbL, 0xceb42022L, 0xca753d95L, + 0xf23a8028L, 0xf6fb9d9fL, 0xfbb8bb46L, 0xff79a6f1L, + 0xe13ef6f4L, 0xe5ffeb43L, 0xe8bccd9aL, 0xec7dd02dL, + 0x34867077L, 0x30476dc0L, 0x3d044b19L, 0x39c556aeL, + 0x278206abL, 0x23431b1cL, 0x2e003dc5L, 0x2ac12072L, + 0x128e9dcfL, 0x164f8078L, 0x1b0ca6a1L, 0x1fcdbb16L, + 0x018aeb13L, 0x054bf6a4L, 0x0808d07dL, 0x0cc9cdcaL, + 0x7897ab07L, 0x7c56b6b0L, 0x71159069L, 0x75d48ddeL, + 0x6b93dddbL, 0x6f52c06cL, 0x6211e6b5L, 0x66d0fb02L, + 0x5e9f46bfL, 0x5a5e5b08L, 0x571d7dd1L, 0x53dc6066L, + 0x4d9b3063L, 0x495a2dd4L, 0x44190b0dL, 0x40d816baL, + 0xaca5c697L, 0xa864db20L, 0xa527fdf9L, 0xa1e6e04eL, + 0xbfa1b04bL, 0xbb60adfcL, 0xb6238b25L, 0xb2e29692L, + 0x8aad2b2fL, 0x8e6c3698L, 0x832f1041L, 0x87ee0df6L, + 0x99a95df3L, 0x9d684044L, 0x902b669dL, 0x94ea7b2aL, + 0xe0b41de7L, 0xe4750050L, 0xe9362689L, 0xedf73b3eL, + 0xf3b06b3bL, 0xf771768cL, 0xfa325055L, 0xfef34de2L, + 0xc6bcf05fL, 0xc27dede8L, 0xcf3ecb31L, 0xcbffd686L, + 0xd5b88683L, 0xd1799b34L, 0xdc3abdedL, 0xd8fba05aL, + 0x690ce0eeL, 0x6dcdfd59L, 0x608edb80L, 0x644fc637L, + 0x7a089632L, 0x7ec98b85L, 0x738aad5cL, 0x774bb0ebL, + 0x4f040d56L, 0x4bc510e1L, 0x46863638L, 0x42472b8fL, + 0x5c007b8aL, 0x58c1663dL, 0x558240e4L, 0x51435d53L, + 0x251d3b9eL, 0x21dc2629L, 0x2c9f00f0L, 0x285e1d47L, + 0x36194d42L, 0x32d850f5L, 0x3f9b762cL, 0x3b5a6b9bL, + 0x0315d626L, 0x07d4cb91L, 0x0a97ed48L, 0x0e56f0ffL, + 0x1011a0faL, 0x14d0bd4dL, 0x19939b94L, 0x1d528623L, + 0xf12f560eL, 0xf5ee4bb9L, 0xf8ad6d60L, 0xfc6c70d7L, + 0xe22b20d2L, 0xe6ea3d65L, 0xeba91bbcL, 0xef68060bL, + 0xd727bbb6L, 0xd3e6a601L, 0xdea580d8L, 0xda649d6fL, + 0xc423cd6aL, 0xc0e2d0ddL, 0xcda1f604L, 0xc960ebb3L, + 0xbd3e8d7eL, 0xb9ff90c9L, 0xb4bcb610L, 0xb07daba7L, + 0xae3afba2L, 0xaafbe615L, 0xa7b8c0ccL, 0xa379dd7bL, + 0x9b3660c6L, 0x9ff77d71L, 0x92b45ba8L, 0x9675461fL, + 0x8832161aL, 0x8cf30badL, 0x81b02d74L, 0x857130c3L, + 0x5d8a9099L, 0x594b8d2eL, 0x5408abf7L, 0x50c9b640L, + 0x4e8ee645L, 0x4a4ffbf2L, 0x470cdd2bL, 0x43cdc09cL, + 0x7b827d21L, 0x7f436096L, 0x7200464fL, 0x76c15bf8L, + 0x68860bfdL, 0x6c47164aL, 0x61043093L, 0x65c52d24L, + 0x119b4be9L, 0x155a565eL, 0x18197087L, 0x1cd86d30L, + 0x029f3d35L, 0x065e2082L, 0x0b1d065bL, 0x0fdc1becL, + 0x3793a651L, 0x3352bbe6L, 0x3e119d3fL, 0x3ad08088L, + 0x2497d08dL, 0x2056cd3aL, 0x2d15ebe3L, 0x29d4f654L, + 0xc5a92679L, 0xc1683bceL, 0xcc2b1d17L, 0xc8ea00a0L, + 0xd6ad50a5L, 0xd26c4d12L, 0xdf2f6bcbL, 0xdbee767cL, + 0xe3a1cbc1L, 0xe760d676L, 0xea23f0afL, 0xeee2ed18L, + 0xf0a5bd1dL, 0xf464a0aaL, 0xf9278673L, 0xfde69bc4L, + 0x89b8fd09L, 0x8d79e0beL, 0x803ac667L, 0x84fbdbd0L, + 0x9abc8bd5L, 0x9e7d9662L, 0x933eb0bbL, 0x97ffad0cL, + 0xafb010b1L, 0xab710d06L, 0xa6322bdfL, 0xa2f33668L, + 0xbcb4666dL, 0xb8757bdaL, 0xb5365d03L, 0xb1f740b4L +}; + + +/*-------------------------------------------------------------*/ +/*--- end crctable.c ---*/ +/*-------------------------------------------------------------*/ + +/*-------------------------------------------------------------*/ +/*--- Library top-level functions. ---*/ +/*--- bzlib.c ---*/ +/*-------------------------------------------------------------*/ + +/*-- + This file is a part of bzip2 and/or libbzip2, a program and + library for lossless, block-sorting data compression. + + Copyright (C) 1996-2004 Julian R Seward. All rights reserved. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions + are met: + + 1. Redistributions of source code must retain the above copyright + notice, this list of conditions and the following disclaimer. + + 2. The origin of this software must not be misrepresented; you must + not claim that you wrote the original software. If you use this + software in a product, an acknowledgment in the product + documentation would be appreciated but is not required. + + 3. Altered source versions must be plainly marked as such, and must + not be misrepresented as being the original software. + + 4. The name of the author may not be used to endorse or promote + products derived from this software without specific prior written + permission. + + THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS + OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY + DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE + GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS + INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING + NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS + SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + Julian Seward, Cambridge, UK. + jseward@bzip.org + bzip2/libbzip2 version 1.0 of 21 March 2000 + + This program is based on (at least) the work of: + Mike Burrows + David Wheeler + Peter Fenwick + Alistair Moffat + Radford Neal + Ian H. Witten + Robert Sedgewick + Jon L. Bentley + + For more information on these sources, see the manual. +--*/ + +/*-- + CHANGES + ~~~~~~~ + 0.9.0 -- original version. + + 0.9.0a/b -- no changes in this file. + + 0.9.0c + * made zero-length BZ_FLUSH work correctly in bzCompress(). + * fixed bzWrite/bzRead to ignore zero-length requests. + * fixed bzread to correctly handle read requests after EOF. + * wrong parameter order in call to bzDecompressInit in + bzBuffToBuffDecompress. Fixed. +--*/ + + + +/*---------------------------------------------------*/ +/*--- Compression stuff ---*/ +/*---------------------------------------------------*/ + + +/*---------------------------------------------------*/ +void BZ2_bz__AssertH__fail ( int errcode ) +{ + vex_printf("BZ2_bz__AssertH__fail(%d) called, exiting\n", errcode); + (*serviceFn)(0,0); +} + +void bz_internal_error ( int errcode ) +{ + vex_printf("bz_internal_error called, exiting\n", errcode); + (*serviceFn)(0,0); +} + +/*---------------------------------------------------*/ +static +int bz_config_ok ( void ) +{ + if (sizeof(int) != 4) return 0; + if (sizeof(short) != 2) return 0; + if (sizeof(char) != 1) return 0; + return 1; +} + + +/*---------------------------------------------------*/ +static +void* default_bzalloc ( void* opaque, Int32 items, Int32 size ) +{ + void* v = (void*) (*serviceFn)(2, items * size ); + return v; +} + +static +void default_bzfree ( void* opaque, void* addr ) +{ + if (addr != NULL) (*serviceFn)( 3, (HWord)addr ); +} + + +/*---------------------------------------------------*/ +static +void prepare_new_block ( EState* s ) +{ + Int32 i; + s->nblock = 0; + s->numZ = 0; + s->state_out_pos = 0; + BZ_INITIALISE_CRC ( s->blockCRC ); + for (i = 0; i < 256; i++) s->inUse[i] = False; + s->blockNo++; +} + + +/*---------------------------------------------------*/ +static +void init_RL ( EState* s ) +{ + s->state_in_ch = 256; + s->state_in_len = 0; +} + + +static +Bool isempty_RL ( EState* s ) +{ + if (s->state_in_ch < 256 && s->state_in_len > 0) + return False; else + return True; +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzCompressInit) + ( bz_stream* strm, + int blockSize100k, + int verbosity, + int workFactor ) +{ + Int32 n; + EState* s; + + if (!bz_config_ok()) return BZ_CONFIG_ERROR; + + if (strm == NULL || + blockSize100k < 1 || blockSize100k > 9 || + workFactor < 0 || workFactor > 250) + return BZ_PARAM_ERROR; + + if (workFactor == 0) workFactor = 30; + if (strm->bzalloc == NULL) strm->bzalloc = default_bzalloc; + if (strm->bzfree == NULL) strm->bzfree = default_bzfree; + + s = BZALLOC( sizeof(EState) ); + if (s == NULL) return BZ_MEM_ERROR; + s->strm = strm; + + s->arr1 = NULL; + s->arr2 = NULL; + s->ftab = NULL; + + n = 100000 * blockSize100k; + s->arr1 = BZALLOC( n * sizeof(UInt32) ); + s->arr2 = BZALLOC( (n+BZ_N_OVERSHOOT) * sizeof(UInt32) ); + s->ftab = BZALLOC( 65537 * sizeof(UInt32) ); + + if (s->arr1 == NULL || s->arr2 == NULL || s->ftab == NULL) { + if (s->arr1 != NULL) BZFREE(s->arr1); + if (s->arr2 != NULL) BZFREE(s->arr2); + if (s->ftab != NULL) BZFREE(s->ftab); + if (s != NULL) BZFREE(s); + return BZ_MEM_ERROR; + } + + s->blockNo = 0; + s->state = BZ_S_INPUT; + s->mode = BZ_M_RUNNING; + s->combinedCRC = 0; + s->blockSize100k = blockSize100k; + s->nblockMAX = 100000 * blockSize100k - 19; + s->verbosity = verbosity; + s->workFactor = workFactor; + + s->block = (UChar*)s->arr2; + s->mtfv = (UInt16*)s->arr1; + s->zbits = NULL; + s->ptr = (UInt32*)s->arr1; + + strm->state = s; + strm->total_in_lo32 = 0; + strm->total_in_hi32 = 0; + strm->total_out_lo32 = 0; + strm->total_out_hi32 = 0; + init_RL ( s ); + prepare_new_block ( s ); + return BZ_OK; +} + + +/*---------------------------------------------------*/ +static +void add_pair_to_block ( EState* s ) +{ + Int32 i; + UChar ch = (UChar)(s->state_in_ch); + for (i = 0; i < s->state_in_len; i++) { + BZ_UPDATE_CRC( s->blockCRC, ch ); + } + s->inUse[s->state_in_ch] = True; + switch (s->state_in_len) { + case 1: + s->block[s->nblock] = (UChar)ch; s->nblock++; + break; + case 2: + s->block[s->nblock] = (UChar)ch; s->nblock++; + s->block[s->nblock] = (UChar)ch; s->nblock++; + break; + case 3: + s->block[s->nblock] = (UChar)ch; s->nblock++; + s->block[s->nblock] = (UChar)ch; s->nblock++; + s->block[s->nblock] = (UChar)ch; s->nblock++; + break; + default: + s->inUse[s->state_in_len-4] = True; + s->block[s->nblock] = (UChar)ch; s->nblock++; + s->block[s->nblock] = (UChar)ch; s->nblock++; + s->block[s->nblock] = (UChar)ch; s->nblock++; + s->block[s->nblock] = (UChar)ch; s->nblock++; + s->block[s->nblock] = ((UChar)(s->state_in_len-4)); + s->nblock++; + break; + } +} + + +/*---------------------------------------------------*/ +static +void flush_RL ( EState* s ) +{ + if (s->state_in_ch < 256) add_pair_to_block ( s ); + init_RL ( s ); +} + + +/*---------------------------------------------------*/ +#define ADD_CHAR_TO_BLOCK(zs,zchh0) \ +{ \ + UInt32 zchh = (UInt32)(zchh0); \ + /*-- fast track the common case --*/ \ + if (zchh != zs->state_in_ch && \ + zs->state_in_len == 1) { \ + UChar ch = (UChar)(zs->state_in_ch); \ + BZ_UPDATE_CRC( zs->blockCRC, ch ); \ + zs->inUse[zs->state_in_ch] = True; \ + zs->block[zs->nblock] = (UChar)ch; \ + zs->nblock++; \ + zs->state_in_ch = zchh; \ + } \ + else \ + /*-- general, uncommon cases --*/ \ + if (zchh != zs->state_in_ch || \ + zs->state_in_len == 255) { \ + if (zs->state_in_ch < 256) \ + add_pair_to_block ( zs ); \ + zs->state_in_ch = zchh; \ + zs->state_in_len = 1; \ + } else { \ + zs->state_in_len++; \ + } \ +} + + +/*---------------------------------------------------*/ +static +Bool copy_input_until_stop ( EState* s ) +{ + Bool progress_in = False; + + if (s->mode == BZ_M_RUNNING) { + + /*-- fast track the common case --*/ + while (True) { + /*-- block full? --*/ + if (s->nblock >= s->nblockMAX) break; + /*-- no input? --*/ + if (s->strm->avail_in == 0) break; + progress_in = True; + ADD_CHAR_TO_BLOCK ( s, (UInt32)(*((UChar*)(s->strm->next_in))) ); + s->strm->next_in++; + s->strm->avail_in--; + s->strm->total_in_lo32++; + if (s->strm->total_in_lo32 == 0) s->strm->total_in_hi32++; + } + + } else { + + /*-- general, uncommon case --*/ + while (True) { + /*-- block full? --*/ + if (s->nblock >= s->nblockMAX) break; + /*-- no input? --*/ + if (s->strm->avail_in == 0) break; + /*-- flush/finish end? --*/ + if (s->avail_in_expect == 0) break; + progress_in = True; + ADD_CHAR_TO_BLOCK ( s, (UInt32)(*((UChar*)(s->strm->next_in))) ); + s->strm->next_in++; + s->strm->avail_in--; + s->strm->total_in_lo32++; + if (s->strm->total_in_lo32 == 0) s->strm->total_in_hi32++; + s->avail_in_expect--; + } + } + return progress_in; +} + + +/*---------------------------------------------------*/ +static +Bool copy_output_until_stop ( EState* s ) +{ + Bool progress_out = False; + + while (True) { + + /*-- no output space? --*/ + if (s->strm->avail_out == 0) break; + + /*-- block done? --*/ + if (s->state_out_pos >= s->numZ) break; + + progress_out = True; + *(s->strm->next_out) = s->zbits[s->state_out_pos]; + s->state_out_pos++; + s->strm->avail_out--; + s->strm->next_out++; + s->strm->total_out_lo32++; + if (s->strm->total_out_lo32 == 0) s->strm->total_out_hi32++; + } + + return progress_out; +} + + +/*---------------------------------------------------*/ +static +Bool handle_compress ( bz_stream* strm ) +{ + Bool progress_in = False; + Bool progress_out = False; + EState* s = strm->state; + + while (True) { + + if (s->state == BZ_S_OUTPUT) { + progress_out |= copy_output_until_stop ( s ); + if (s->state_out_pos < s->numZ) break; + if (s->mode == BZ_M_FINISHING && + s->avail_in_expect == 0 && + isempty_RL(s)) break; + prepare_new_block ( s ); + s->state = BZ_S_INPUT; + if (s->mode == BZ_M_FLUSHING && + s->avail_in_expect == 0 && + isempty_RL(s)) break; + } + + if (s->state == BZ_S_INPUT) { + progress_in |= copy_input_until_stop ( s ); + if (s->mode != BZ_M_RUNNING && s->avail_in_expect == 0) { + flush_RL ( s ); + BZ2_compressBlock ( s, (Bool)(s->mode == BZ_M_FINISHING) ); + s->state = BZ_S_OUTPUT; + } + else + if (s->nblock >= s->nblockMAX) { + BZ2_compressBlock ( s, False ); + s->state = BZ_S_OUTPUT; + } + else + if (s->strm->avail_in == 0) { + break; + } + } + + } + + return progress_in || progress_out; +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzCompress) ( bz_stream *strm, int action ) +{ + Bool progress; + EState* s; + if (strm == NULL) return BZ_PARAM_ERROR; + s = strm->state; + if (s == NULL) return BZ_PARAM_ERROR; + if (s->strm != strm) return BZ_PARAM_ERROR; + + preswitch: + switch (s->mode) { + + case BZ_M_IDLE: + return BZ_SEQUENCE_ERROR; + + case BZ_M_RUNNING: + if (action == BZ_RUN) { + progress = handle_compress ( strm ); + return progress ? BZ_RUN_OK : BZ_PARAM_ERROR; + } + else + if (action == BZ_FLUSH) { + s->avail_in_expect = strm->avail_in; + s->mode = BZ_M_FLUSHING; + goto preswitch; + } + else + if (action == BZ_FINISH) { + s->avail_in_expect = strm->avail_in; + s->mode = BZ_M_FINISHING; + goto preswitch; + } + else + return BZ_PARAM_ERROR; + + case BZ_M_FLUSHING: + if (action != BZ_FLUSH) return BZ_SEQUENCE_ERROR; + if (s->avail_in_expect != s->strm->avail_in) + return BZ_SEQUENCE_ERROR; + progress = handle_compress ( strm ); + if (s->avail_in_expect > 0 || !isempty_RL(s) || + s->state_out_pos < s->numZ) return BZ_FLUSH_OK; + s->mode = BZ_M_RUNNING; + return BZ_RUN_OK; + + case BZ_M_FINISHING: + if (action != BZ_FINISH) return BZ_SEQUENCE_ERROR; + if (s->avail_in_expect != s->strm->avail_in) + return BZ_SEQUENCE_ERROR; + progress = handle_compress ( strm ); + if (!progress) return BZ_SEQUENCE_ERROR; + if (s->avail_in_expect > 0 || !isempty_RL(s) || + s->state_out_pos < s->numZ) return BZ_FINISH_OK; + s->mode = BZ_M_IDLE; + return BZ_STREAM_END; + } + return BZ_OK; /*--not reached--*/ +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzCompressEnd) ( bz_stream *strm ) +{ + EState* s; + if (strm == NULL) return BZ_PARAM_ERROR; + s = strm->state; + if (s == NULL) return BZ_PARAM_ERROR; + if (s->strm != strm) return BZ_PARAM_ERROR; + + if (s->arr1 != NULL) BZFREE(s->arr1); + if (s->arr2 != NULL) BZFREE(s->arr2); + if (s->ftab != NULL) BZFREE(s->ftab); + BZFREE(strm->state); + + strm->state = NULL; + + return BZ_OK; +} + + +/*---------------------------------------------------*/ +/*--- Decompression stuff ---*/ +/*---------------------------------------------------*/ + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzDecompressInit) + ( bz_stream* strm, + int verbosity, + int small ) +{ + DState* s; + + if (!bz_config_ok()) return BZ_CONFIG_ERROR; + + if (strm == NULL) return BZ_PARAM_ERROR; + if (small != 0 && small != 1) return BZ_PARAM_ERROR; + if (verbosity < 0 || verbosity > 4) return BZ_PARAM_ERROR; + + if (strm->bzalloc == NULL) strm->bzalloc = default_bzalloc; + if (strm->bzfree == NULL) strm->bzfree = default_bzfree; + + s = BZALLOC( sizeof(DState) ); + if (s == NULL) return BZ_MEM_ERROR; + s->strm = strm; + strm->state = s; + s->state = BZ_X_MAGIC_1; + s->bsLive = 0; + s->bsBuff = 0; + s->calculatedCombinedCRC = 0; + strm->total_in_lo32 = 0; + strm->total_in_hi32 = 0; + strm->total_out_lo32 = 0; + strm->total_out_hi32 = 0; + s->smallDecompress = (Bool)small; + s->ll4 = NULL; + s->ll16 = NULL; + s->tt = NULL; + s->currBlockNo = 0; + s->verbosity = verbosity; + + return BZ_OK; +} + + +/*---------------------------------------------------*/ +/* Return True iff data corruption is discovered. + Returns False if there is no problem. +*/ +static +Bool unRLE_obuf_to_output_FAST ( DState* s ) +{ + UChar k1; + + if (s->blockRandomised) { + + while (True) { + /* try to finish existing run */ + while (True) { + if (s->strm->avail_out == 0) return False; + if (s->state_out_len == 0) break; + *( (UChar*)(s->strm->next_out) ) = s->state_out_ch; + BZ_UPDATE_CRC ( s->calculatedBlockCRC, s->state_out_ch ); + s->state_out_len--; + s->strm->next_out++; + s->strm->avail_out--; + s->strm->total_out_lo32++; + if (s->strm->total_out_lo32 == 0) s->strm->total_out_hi32++; + } + + /* can a new run be started? */ + if (s->nblock_used == s->save_nblock+1) return False; + + /* Only caused by corrupt data stream? */ + if (s->nblock_used > s->save_nblock+1) + return True; + + s->state_out_len = 1; + s->state_out_ch = s->k0; + BZ_GET_FAST(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + s->state_out_len = 2; + BZ_GET_FAST(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + s->state_out_len = 3; + BZ_GET_FAST(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + BZ_GET_FAST(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + s->state_out_len = ((Int32)k1) + 4; + BZ_GET_FAST(s->k0); BZ_RAND_UPD_MASK; + s->k0 ^= BZ_RAND_MASK; s->nblock_used++; + } + + } else { + + /* restore */ + UInt32 c_calculatedBlockCRC = s->calculatedBlockCRC; + UChar c_state_out_ch = s->state_out_ch; + Int32 c_state_out_len = s->state_out_len; + Int32 c_nblock_used = s->nblock_used; + Int32 c_k0 = s->k0; + UInt32* c_tt = s->tt; + UInt32 c_tPos = s->tPos; + char* cs_next_out = s->strm->next_out; + unsigned int cs_avail_out = s->strm->avail_out; + /* end restore */ + + UInt32 avail_out_INIT = cs_avail_out; + Int32 s_save_nblockPP = s->save_nblock+1; + unsigned int total_out_lo32_old; + + while (True) { + + /* try to finish existing run */ + if (c_state_out_len > 0) { + while (True) { + if (cs_avail_out == 0) goto return_notr; + if (c_state_out_len == 1) break; + *( (UChar*)(cs_next_out) ) = c_state_out_ch; + BZ_UPDATE_CRC ( c_calculatedBlockCRC, c_state_out_ch ); + c_state_out_len--; + cs_next_out++; + cs_avail_out--; + } + s_state_out_len_eq_one: + { + if (cs_avail_out == 0) { + c_state_out_len = 1; goto return_notr; + }; + *( (UChar*)(cs_next_out) ) = c_state_out_ch; + BZ_UPDATE_CRC ( c_calculatedBlockCRC, c_state_out_ch ); + cs_next_out++; + cs_avail_out--; + } + } + /* Only caused by corrupt data stream? */ + if (c_nblock_used > s_save_nblockPP) + return True; + + /* can a new run be started? */ + if (c_nblock_used == s_save_nblockPP) { + c_state_out_len = 0; goto return_notr; + }; + c_state_out_ch = c_k0; + BZ_GET_FAST_C(k1); c_nblock_used++; + if (k1 != c_k0) { + c_k0 = k1; goto s_state_out_len_eq_one; + }; + if (c_nblock_used == s_save_nblockPP) + goto s_state_out_len_eq_one; + + c_state_out_len = 2; + BZ_GET_FAST_C(k1); c_nblock_used++; + if (c_nblock_used == s_save_nblockPP) continue; + if (k1 != c_k0) { c_k0 = k1; continue; }; + + c_state_out_len = 3; + BZ_GET_FAST_C(k1); c_nblock_used++; + if (c_nblock_used == s_save_nblockPP) continue; + if (k1 != c_k0) { c_k0 = k1; continue; }; + + BZ_GET_FAST_C(k1); c_nblock_used++; + c_state_out_len = ((Int32)k1) + 4; + BZ_GET_FAST_C(c_k0); c_nblock_used++; + } + + return_notr: + total_out_lo32_old = s->strm->total_out_lo32; + s->strm->total_out_lo32 += (avail_out_INIT - cs_avail_out); + if (s->strm->total_out_lo32 < total_out_lo32_old) + s->strm->total_out_hi32++; + + /* save */ + s->calculatedBlockCRC = c_calculatedBlockCRC; + s->state_out_ch = c_state_out_ch; + s->state_out_len = c_state_out_len; + s->nblock_used = c_nblock_used; + s->k0 = c_k0; + s->tt = c_tt; + s->tPos = c_tPos; + s->strm->next_out = cs_next_out; + s->strm->avail_out = cs_avail_out; + /* end save */ + } + return False; +} + + + +/*---------------------------------------------------*/ +/* Return True iff data corruption is discovered. + Returns False if there is no problem. +*/ +static +Bool unRLE_obuf_to_output_SMALL ( DState* s ) +{ + UChar k1; + + if (s->blockRandomised) { + + while (True) { + /* try to finish existing run */ + while (True) { + if (s->strm->avail_out == 0) return False; + if (s->state_out_len == 0) break; + *( (UChar*)(s->strm->next_out) ) = s->state_out_ch; + BZ_UPDATE_CRC ( s->calculatedBlockCRC, s->state_out_ch ); + s->state_out_len--; + s->strm->next_out++; + s->strm->avail_out--; + s->strm->total_out_lo32++; + if (s->strm->total_out_lo32 == 0) s->strm->total_out_hi32++; + } + + /* can a new run be started? */ + if (s->nblock_used == s->save_nblock+1) return False; + + /* Only caused by corrupt data stream? */ + if (s->nblock_used > s->save_nblock+1) + return True; + + s->state_out_len = 1; + s->state_out_ch = s->k0; + BZ_GET_SMALL(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + s->state_out_len = 2; + BZ_GET_SMALL(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + s->state_out_len = 3; + BZ_GET_SMALL(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + BZ_GET_SMALL(k1); BZ_RAND_UPD_MASK; + k1 ^= BZ_RAND_MASK; s->nblock_used++; + s->state_out_len = ((Int32)k1) + 4; + BZ_GET_SMALL(s->k0); BZ_RAND_UPD_MASK; + s->k0 ^= BZ_RAND_MASK; s->nblock_used++; + } + + } else { + + while (True) { + /* try to finish existing run */ + while (True) { + if (s->strm->avail_out == 0) return False; + if (s->state_out_len == 0) break; + *( (UChar*)(s->strm->next_out) ) = s->state_out_ch; + BZ_UPDATE_CRC ( s->calculatedBlockCRC, s->state_out_ch ); + s->state_out_len--; + s->strm->next_out++; + s->strm->avail_out--; + s->strm->total_out_lo32++; + if (s->strm->total_out_lo32 == 0) s->strm->total_out_hi32++; + } + + /* can a new run be started? */ + if (s->nblock_used == s->save_nblock+1) return False; + + /* Only caused by corrupt data stream? */ + if (s->nblock_used > s->save_nblock+1) + return True; + + s->state_out_len = 1; + s->state_out_ch = s->k0; + BZ_GET_SMALL(k1); s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + s->state_out_len = 2; + BZ_GET_SMALL(k1); s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + s->state_out_len = 3; + BZ_GET_SMALL(k1); s->nblock_used++; + if (s->nblock_used == s->save_nblock+1) continue; + if (k1 != s->k0) { s->k0 = k1; continue; }; + + BZ_GET_SMALL(k1); s->nblock_used++; + s->state_out_len = ((Int32)k1) + 4; + BZ_GET_SMALL(s->k0); s->nblock_used++; + } + + } +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzDecompress) ( bz_stream *strm ) +{ + Bool corrupt; + DState* s; + if (strm == NULL) return BZ_PARAM_ERROR; + s = strm->state; + if (s == NULL) return BZ_PARAM_ERROR; + if (s->strm != strm) return BZ_PARAM_ERROR; + + while (True) { + if (s->state == BZ_X_IDLE) return BZ_SEQUENCE_ERROR; + if (s->state == BZ_X_OUTPUT) { + if (s->smallDecompress) + corrupt = unRLE_obuf_to_output_SMALL ( s ); else + corrupt = unRLE_obuf_to_output_FAST ( s ); + if (corrupt) return BZ_DATA_ERROR; + if (s->nblock_used == s->save_nblock+1 && s->state_out_len == 0) { + BZ_FINALISE_CRC ( s->calculatedBlockCRC ); + if (s->verbosity >= 3) + VPrintf2 ( " {0x%08x, 0x%08x}", s->storedBlockCRC, + s->calculatedBlockCRC ); + if (s->verbosity >= 2) VPrintf0 ( "]" ); + if (s->calculatedBlockCRC != s->storedBlockCRC) + return BZ_DATA_ERROR; + s->calculatedCombinedCRC + = (s->calculatedCombinedCRC << 1) | + (s->calculatedCombinedCRC >> 31); + s->calculatedCombinedCRC ^= s->calculatedBlockCRC; + s->state = BZ_X_BLKHDR_1; + } else { + return BZ_OK; + } + } + if (s->state >= BZ_X_MAGIC_1) { + Int32 r = BZ2_decompress ( s ); + if (r == BZ_STREAM_END) { + if (s->verbosity >= 3) + VPrintf2 ( "\n combined CRCs: stored = 0x%08x, computed = 0x%08x", + s->storedCombinedCRC, s->calculatedCombinedCRC ); + if (s->calculatedCombinedCRC != s->storedCombinedCRC) + return BZ_DATA_ERROR; + return r; + } + if (s->state != BZ_X_OUTPUT) return r; + } + } + + AssertH ( 0, 6001 ); + + return 0; /*NOTREACHED*/ +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzDecompressEnd) ( bz_stream *strm ) +{ + DState* s; + if (strm == NULL) return BZ_PARAM_ERROR; + s = strm->state; + if (s == NULL) return BZ_PARAM_ERROR; + if (s->strm != strm) return BZ_PARAM_ERROR; + + if (s->tt != NULL) BZFREE(s->tt); + if (s->ll16 != NULL) BZFREE(s->ll16); + if (s->ll4 != NULL) BZFREE(s->ll4); + + BZFREE(strm->state); + strm->state = NULL; + + return BZ_OK; +} + + +#ifndef BZ_NO_STDIO +/*---------------------------------------------------*/ +/*--- File I/O stuff ---*/ +/*---------------------------------------------------*/ + +#define BZ_SETERR(eee) \ +{ \ + if (bzerror != NULL) *bzerror = eee; \ + if (bzf != NULL) bzf->lastErr = eee; \ +} + +typedef + struct { + FILE* handle; + Char buf[BZ_MAX_UNUSED]; + Int32 bufN; + Bool writing; + bz_stream strm; + Int32 lastErr; + Bool initialisedOk; + } + bzFile; + + +/*---------------------------------------------*/ +static Bool myfeof ( FILE* f ) +{ + Int32 c = fgetc ( f ); + if (c == EOF) return True; + ungetc ( c, f ); + return False; +} + + +/*---------------------------------------------------*/ +BZFILE* BZ_API(BZ2_bzWriteOpen) + ( int* bzerror, + FILE* f, + int blockSize100k, + int verbosity, + int workFactor ) +{ + Int32 ret; + bzFile* bzf = NULL; + + BZ_SETERR(BZ_OK); + + if (f == NULL || + (blockSize100k < 1 || blockSize100k > 9) || + (workFactor < 0 || workFactor > 250) || + (verbosity < 0 || verbosity > 4)) + { BZ_SETERR(BZ_PARAM_ERROR); return NULL; }; + + if (ferror(f)) + { BZ_SETERR(BZ_IO_ERROR); return NULL; }; + + bzf = malloc ( sizeof(bzFile) ); + if (bzf == NULL) + { BZ_SETERR(BZ_MEM_ERROR); return NULL; }; + + BZ_SETERR(BZ_OK); + bzf->initialisedOk = False; + bzf->bufN = 0; + bzf->handle = f; + bzf->writing = True; + bzf->strm.bzalloc = NULL; + bzf->strm.bzfree = NULL; + bzf->strm.opaque = NULL; + + if (workFactor == 0) workFactor = 30; + ret = BZ2_bzCompressInit ( &(bzf->strm), blockSize100k, + verbosity, workFactor ); + if (ret != BZ_OK) + { BZ_SETERR(ret); free(bzf); return NULL; }; + + bzf->strm.avail_in = 0; + bzf->initialisedOk = True; + return bzf; +} + + + +/*---------------------------------------------------*/ +void BZ_API(BZ2_bzWrite) + ( int* bzerror, + BZFILE* b, + void* buf, + int len ) +{ + Int32 n, n2, ret; + bzFile* bzf = (bzFile*)b; + + BZ_SETERR(BZ_OK); + if (bzf == NULL || buf == NULL || len < 0) + { BZ_SETERR(BZ_PARAM_ERROR); return; }; + if (!(bzf->writing)) + { BZ_SETERR(BZ_SEQUENCE_ERROR); return; }; + if (ferror(bzf->handle)) + { BZ_SETERR(BZ_IO_ERROR); return; }; + + if (len == 0) + { BZ_SETERR(BZ_OK); return; }; + + bzf->strm.avail_in = len; + bzf->strm.next_in = buf; + + while (True) { + bzf->strm.avail_out = BZ_MAX_UNUSED; + bzf->strm.next_out = bzf->buf; + ret = BZ2_bzCompress ( &(bzf->strm), BZ_RUN ); + if (ret != BZ_RUN_OK) + { BZ_SETERR(ret); return; }; + + if (bzf->strm.avail_out < BZ_MAX_UNUSED) { + n = BZ_MAX_UNUSED - bzf->strm.avail_out; + n2 = fwrite ( (void*)(bzf->buf), sizeof(UChar), + n, bzf->handle ); + if (n != n2 || ferror(bzf->handle)) + { BZ_SETERR(BZ_IO_ERROR); return; }; + } + + if (bzf->strm.avail_in == 0) + { BZ_SETERR(BZ_OK); return; }; + } +} + + +/*---------------------------------------------------*/ +void BZ_API(BZ2_bzWriteClose) + ( int* bzerror, + BZFILE* b, + int abandon, + unsigned int* nbytes_in, + unsigned int* nbytes_out ) +{ + BZ2_bzWriteClose64 ( bzerror, b, abandon, + nbytes_in, NULL, nbytes_out, NULL ); +} + + +void BZ_API(BZ2_bzWriteClose64) + ( int* bzerror, + BZFILE* b, + int abandon, + unsigned int* nbytes_in_lo32, + unsigned int* nbytes_in_hi32, + unsigned int* nbytes_out_lo32, + unsigned int* nbytes_out_hi32 ) +{ + Int32 n, n2, ret; + bzFile* bzf = (bzFile*)b; + + if (bzf == NULL) + { BZ_SETERR(BZ_OK); return; }; + if (!(bzf->writing)) + { BZ_SETERR(BZ_SEQUENCE_ERROR); return; }; + if (ferror(bzf->handle)) + { BZ_SETERR(BZ_IO_ERROR); return; }; + + if (nbytes_in_lo32 != NULL) *nbytes_in_lo32 = 0; + if (nbytes_in_hi32 != NULL) *nbytes_in_hi32 = 0; + if (nbytes_out_lo32 != NULL) *nbytes_out_lo32 = 0; + if (nbytes_out_hi32 != NULL) *nbytes_out_hi32 = 0; + + if ((!abandon) && bzf->lastErr == BZ_OK) { + while (True) { + bzf->strm.avail_out = BZ_MAX_UNUSED; + bzf->strm.next_out = bzf->buf; + ret = BZ2_bzCompress ( &(bzf->strm), BZ_FINISH ); + if (ret != BZ_FINISH_OK && ret != BZ_STREAM_END) + { BZ_SETERR(ret); return; }; + + if (bzf->strm.avail_out < BZ_MAX_UNUSED) { + n = BZ_MAX_UNUSED - bzf->strm.avail_out; + n2 = fwrite ( (void*)(bzf->buf), sizeof(UChar), + n, bzf->handle ); + if (n != n2 || ferror(bzf->handle)) + { BZ_SETERR(BZ_IO_ERROR); return; }; + } + + if (ret == BZ_STREAM_END) break; + } + } + + if ( !abandon && !ferror ( bzf->handle ) ) { + fflush ( bzf->handle ); + if (ferror(bzf->handle)) + { BZ_SETERR(BZ_IO_ERROR); return; }; + } + + if (nbytes_in_lo32 != NULL) + *nbytes_in_lo32 = bzf->strm.total_in_lo32; + if (nbytes_in_hi32 != NULL) + *nbytes_in_hi32 = bzf->strm.total_in_hi32; + if (nbytes_out_lo32 != NULL) + *nbytes_out_lo32 = bzf->strm.total_out_lo32; + if (nbytes_out_hi32 != NULL) + *nbytes_out_hi32 = bzf->strm.total_out_hi32; + + BZ_SETERR(BZ_OK); + BZ2_bzCompressEnd ( &(bzf->strm) ); + free ( bzf ); +} + + +/*---------------------------------------------------*/ +BZFILE* BZ_API(BZ2_bzReadOpen) + ( int* bzerror, + FILE* f, + int verbosity, + int small, + void* unused, + int nUnused ) +{ + bzFile* bzf = NULL; + int ret; + + BZ_SETERR(BZ_OK); + + if (f == NULL || + (small != 0 && small != 1) || + (verbosity < 0 || verbosity > 4) || + (unused == NULL && nUnused != 0) || + (unused != NULL && (nUnused < 0 || nUnused > BZ_MAX_UNUSED))) + { BZ_SETERR(BZ_PARAM_ERROR); return NULL; }; + + if (ferror(f)) + { BZ_SETERR(BZ_IO_ERROR); return NULL; }; + + bzf = malloc ( sizeof(bzFile) ); + if (bzf == NULL) + { BZ_SETERR(BZ_MEM_ERROR); return NULL; }; + + BZ_SETERR(BZ_OK); + + bzf->initialisedOk = False; + bzf->handle = f; + bzf->bufN = 0; + bzf->writing = False; + bzf->strm.bzalloc = NULL; + bzf->strm.bzfree = NULL; + bzf->strm.opaque = NULL; + + while (nUnused > 0) { + bzf->buf[bzf->bufN] = *((UChar*)(unused)); bzf->bufN++; + unused = ((void*)( 1 + ((UChar*)(unused)) )); + nUnused--; + } + + ret = BZ2_bzDecompressInit ( &(bzf->strm), verbosity, small ); + if (ret != BZ_OK) + { BZ_SETERR(ret); free(bzf); return NULL; }; + + bzf->strm.avail_in = bzf->bufN; + bzf->strm.next_in = bzf->buf; + + bzf->initialisedOk = True; + return bzf; +} + + +/*---------------------------------------------------*/ +void BZ_API(BZ2_bzReadClose) ( int *bzerror, BZFILE *b ) +{ + bzFile* bzf = (bzFile*)b; + + BZ_SETERR(BZ_OK); + if (bzf == NULL) + { BZ_SETERR(BZ_OK); return; }; + + if (bzf->writing) + { BZ_SETERR(BZ_SEQUENCE_ERROR); return; }; + + if (bzf->initialisedOk) + (void)BZ2_bzDecompressEnd ( &(bzf->strm) ); + free ( bzf ); +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzRead) + ( int* bzerror, + BZFILE* b, + void* buf, + int len ) +{ + Int32 n, ret; + bzFile* bzf = (bzFile*)b; + + BZ_SETERR(BZ_OK); + + if (bzf == NULL || buf == NULL || len < 0) + { BZ_SETERR(BZ_PARAM_ERROR); return 0; }; + + if (bzf->writing) + { BZ_SETERR(BZ_SEQUENCE_ERROR); return 0; }; + + if (len == 0) + { BZ_SETERR(BZ_OK); return 0; }; + + bzf->strm.avail_out = len; + bzf->strm.next_out = buf; + + while (True) { + + if (ferror(bzf->handle)) + { BZ_SETERR(BZ_IO_ERROR); return 0; }; + + if (bzf->strm.avail_in == 0 && !myfeof(bzf->handle)) { + n = fread ( bzf->buf, sizeof(UChar), + BZ_MAX_UNUSED, bzf->handle ); + if (ferror(bzf->handle)) + { BZ_SETERR(BZ_IO_ERROR); return 0; }; + bzf->bufN = n; + bzf->strm.avail_in = bzf->bufN; + bzf->strm.next_in = bzf->buf; + } + + ret = BZ2_bzDecompress ( &(bzf->strm) ); + + if (ret != BZ_OK && ret != BZ_STREAM_END) + { BZ_SETERR(ret); return 0; }; + + if (ret == BZ_OK && myfeof(bzf->handle) && + bzf->strm.avail_in == 0 && bzf->strm.avail_out > 0) + { BZ_SETERR(BZ_UNEXPECTED_EOF); return 0; }; + + if (ret == BZ_STREAM_END) + { BZ_SETERR(BZ_STREAM_END); + return len - bzf->strm.avail_out; }; + if (bzf->strm.avail_out == 0) + { BZ_SETERR(BZ_OK); return len; }; + + } + + return 0; /*not reached*/ +} + + +/*---------------------------------------------------*/ +void BZ_API(BZ2_bzReadGetUnused) + ( int* bzerror, + BZFILE* b, + void** unused, + int* nUnused ) +{ + bzFile* bzf = (bzFile*)b; + if (bzf == NULL) + { BZ_SETERR(BZ_PARAM_ERROR); return; }; + if (bzf->lastErr != BZ_STREAM_END) + { BZ_SETERR(BZ_SEQUENCE_ERROR); return; }; + if (unused == NULL || nUnused == NULL) + { BZ_SETERR(BZ_PARAM_ERROR); return; }; + + BZ_SETERR(BZ_OK); + *nUnused = bzf->strm.avail_in; + *unused = bzf->strm.next_in; +} +#endif + + +/*---------------------------------------------------*/ +/*--- Misc convenience stuff ---*/ +/*---------------------------------------------------*/ + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzBuffToBuffCompress) + ( char* dest, + unsigned int* destLen, + char* source, + unsigned int sourceLen, + int blockSize100k, + int verbosity, + int workFactor ) +{ + bz_stream strm; + int ret; + + if (dest == NULL || destLen == NULL || + source == NULL || + blockSize100k < 1 || blockSize100k > 9 || + verbosity < 0 || verbosity > 4 || + workFactor < 0 || workFactor > 250) + return BZ_PARAM_ERROR; + + if (workFactor == 0) workFactor = 30; + strm.bzalloc = NULL; + strm.bzfree = NULL; + strm.opaque = NULL; + ret = BZ2_bzCompressInit ( &strm, blockSize100k, + verbosity, workFactor ); + if (ret != BZ_OK) return ret; + + strm.next_in = source; + strm.next_out = dest; + strm.avail_in = sourceLen; + strm.avail_out = *destLen; + + ret = BZ2_bzCompress ( &strm, BZ_FINISH ); + if (ret == BZ_FINISH_OK) goto output_overflow; + if (ret != BZ_STREAM_END) goto errhandler; + + /* normal termination */ + *destLen -= strm.avail_out; + BZ2_bzCompressEnd ( &strm ); + return BZ_OK; + + output_overflow: + BZ2_bzCompressEnd ( &strm ); + return BZ_OUTBUFF_FULL; + + errhandler: + BZ2_bzCompressEnd ( &strm ); + return ret; +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzBuffToBuffDecompress) + ( char* dest, + unsigned int* destLen, + char* source, + unsigned int sourceLen, + int small, + int verbosity ) +{ + bz_stream strm; + int ret; + + if (dest == NULL || destLen == NULL || + source == NULL || + (small != 0 && small != 1) || + verbosity < 0 || verbosity > 4) + return BZ_PARAM_ERROR; + + strm.bzalloc = NULL; + strm.bzfree = NULL; + strm.opaque = NULL; + ret = BZ2_bzDecompressInit ( &strm, verbosity, small ); + if (ret != BZ_OK) return ret; + + strm.next_in = source; + strm.next_out = dest; + strm.avail_in = sourceLen; + strm.avail_out = *destLen; + + ret = BZ2_bzDecompress ( &strm ); + if (ret == BZ_OK) goto output_overflow_or_eof; + if (ret != BZ_STREAM_END) goto errhandler; + + /* normal termination */ + *destLen -= strm.avail_out; + BZ2_bzDecompressEnd ( &strm ); + return BZ_OK; + + output_overflow_or_eof: + if (strm.avail_out > 0) { + BZ2_bzDecompressEnd ( &strm ); + return BZ_UNEXPECTED_EOF; + } else { + BZ2_bzDecompressEnd ( &strm ); + return BZ_OUTBUFF_FULL; + }; + + errhandler: + BZ2_bzDecompressEnd ( &strm ); + return ret; +} + + +/*---------------------------------------------------*/ +/*-- + Code contributed by Yoshioka Tsuneo + (QWF00133@niftyserve.or.jp/tsuneo-y@is.aist-nara.ac.jp), + to support better zlib compatibility. + This code is not _officially_ part of libbzip2 (yet); + I haven't tested it, documented it, or considered the + threading-safeness of it. + If this code breaks, please contact both Yoshioka and me. +--*/ +/*---------------------------------------------------*/ + +/*---------------------------------------------------*/ +/*-- + return version like "0.9.0c". +--*/ +const char * BZ_API(BZ2_bzlibVersion)(void) +{ + return BZ_VERSION; +} + + +#ifndef BZ_NO_STDIO +/*---------------------------------------------------*/ + +#if defined(_WIN32) || defined(OS2) || defined(MSDOS) +# include <fcntl.h> +# include <io.h> +# define SET_BINARY_MODE(file) setmode(fileno(file),O_BINARY) +#else +# define SET_BINARY_MODE(file) +#endif +static +BZFILE * bzopen_or_bzdopen + ( const char *path, /* no use when bzdopen */ + int fd, /* no use when bzdopen */ + const char *mode, + int open_mode) /* bzopen: 0, bzdopen:1 */ +{ + int bzerr; + char unused[BZ_MAX_UNUSED]; + int blockSize100k = 9; + int writing = 0; + char mode2[10] = ""; + FILE *fp = NULL; + BZFILE *bzfp = NULL; + int verbosity = 0; + int workFactor = 30; + int smallMode = 0; + int nUnused = 0; + + if (mode == NULL) return NULL; + while (*mode) { + switch (*mode) { + case 'r': + writing = 0; break; + case 'w': + writing = 1; break; + case 's': + smallMode = 1; break; + default: + if (isdigit((int)(*mode))) { + blockSize100k = *mode-BZ_HDR_0; + } + } + mode++; + } + strcat(mode2, writing ? "w" : "r" ); + strcat(mode2,"b"); /* binary mode */ + + if (open_mode==0) { + if (path==NULL || strcmp(path,"")==0) { + fp = (writing ? stdout : stdin); + SET_BINARY_MODE(fp); + } else { + fp = fopen(path,mode2); + } + } else { +#ifdef BZ_STRICT_ANSI + fp = NULL; +#else + fp = fdopen(fd,mode2); +#endif + } + if (fp == NULL) return NULL; + + if (writing) { + /* Guard against total chaos and anarchy -- JRS */ + if (blockSize100k < 1) blockSize100k = 1; + if (blockSize100k > 9) blockSize100k = 9; + bzfp = BZ2_bzWriteOpen(&bzerr,fp,blockSize100k, + verbosity,workFactor); + } else { + bzfp = BZ2_bzReadOpen(&bzerr,fp,verbosity,smallMode, + unused,nUnused); + } + if (bzfp == NULL) { + if (fp != stdin && fp != stdout) fclose(fp); + return NULL; + } + return bzfp; +} + + +/*---------------------------------------------------*/ +/*-- + open file for read or write. + ex) bzopen("file","w9") + case path="" or NULL => use stdin or stdout. +--*/ +BZFILE * BZ_API(BZ2_bzopen) + ( const char *path, + const char *mode ) +{ + return bzopen_or_bzdopen(path,-1,mode,/*bzopen*/0); +} + + +/*---------------------------------------------------*/ +BZFILE * BZ_API(BZ2_bzdopen) + ( int fd, + const char *mode ) +{ + return bzopen_or_bzdopen(NULL,fd,mode,/*bzdopen*/1); +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzread) (BZFILE* b, void* buf, int len ) +{ + int bzerr, nread; + if (((bzFile*)b)->lastErr == BZ_STREAM_END) return 0; + nread = BZ2_bzRead(&bzerr,b,buf,len); + if (bzerr == BZ_OK || bzerr == BZ_STREAM_END) { + return nread; + } else { + return -1; + } +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzwrite) (BZFILE* b, void* buf, int len ) +{ + int bzerr; + + BZ2_bzWrite(&bzerr,b,buf,len); + if(bzerr == BZ_OK){ + return len; + }else{ + return -1; + } +} + + +/*---------------------------------------------------*/ +int BZ_API(BZ2_bzflush) (BZFILE *b) +{ + /* do nothing now... */ + return 0; +} + + +/*---------------------------------------------------*/ +void BZ_API(BZ2_bzclose) (BZFILE* b) +{ + int bzerr; + FILE *fp = ((bzFile *)b)->handle; + + if (b==NULL) {return;} + if(((bzFile*)b)->writing){ + BZ2_bzWriteClose(&bzerr,b,0,NULL,NULL); + if(bzerr != BZ_OK){ + BZ2_bzWriteClose(NULL,b,1,NULL,NULL); + } + }else{ + BZ2_bzReadClose(&bzerr,b); + } + if(fp!=stdin && fp!=stdout){ + fclose(fp); + } +} + + +/*---------------------------------------------------*/ +/*-- + return last error code +--*/ +static char *bzerrorstrings[] = { + "OK" + ,"SEQUENCE_ERROR" + ,"PARAM_ERROR" + ,"MEM_ERROR" + ,"DATA_ERROR" + ,"DATA_ERROR_MAGIC" + ,"IO_ERROR" + ,"UNEXPECTED_EOF" + ,"OUTBUFF_FULL" + ,"CONFIG_ERROR" + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ +}; + + +const char * BZ_API(BZ2_bzerror) (BZFILE *b, int *errnum) +{ + int err = ((bzFile *)b)->lastErr; + + if(err>0) err = 0; + *errnum = err; + return bzerrorstrings[err*-1]; +} +#endif + + +/*-------------------------------------------------------------*/ +/*--- end bzlib.c ---*/ +/*-------------------------------------------------------------*/ + + +///////////////////////////////////////////////////////////////////// +///////////////////////////////////////////////////////////////////// + + +/* A test program written to test robustness to decompression of + corrupted data. Usage is + unzcrash filename + and the program will read the specified file, compress it (in memory), + and then repeatedly decompress it, each time with a different bit of + the compressed data inverted, so as to test all possible one-bit errors. + This should not cause any invalid memory accesses. If it does, + I want to know about it! + + p.s. As you can see from the above description, the process is + incredibly slow. A file of size eg 5KB will cause it to run for + many hours. +*/ + +//#include <stdio.h> +//#include <assert.h> +//#include "bzlib.h" + +#define M_BLOCK 1000000 + + +#define M_BLOCK_OUT (M_BLOCK + 1000000) + char inbuf[M_BLOCK]; + char outbuf[M_BLOCK_OUT]; + char zbuf[M_BLOCK + 600 + (M_BLOCK / 100)]; + +int nIn; +unsigned int nOut; +unsigned int nZ; + +#if 0 +static char *bzerrorstrings[] = { + "OK" + ,"SEQUENCE_ERROR" + ,"PARAM_ERROR" + ,"MEM_ERROR" + ,"DATA_ERROR" + ,"DATA_ERROR_MAGIC" + ,"IO_ERROR" + ,"UNEXPECTED_EOF" + ,"OUTBUFF_FULL" + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ +}; +#endif + +void flip_bit ( int bit ) +{ + int byteno = bit / 8; + int bitno = bit % 8; + UChar mask = 1 << bitno; + //fprintf ( stderr, "(byte %d bit %d mask %d)", + // byteno, bitno, (int)mask ); + zbuf[byteno] ^= mask; +} + +void set_inbuf ( void ) +{ + inbuf[0] = 0; + my_strcat(inbuf, "At her sixtieth birthday party, Margaret Thatcher "); + my_strcat(inbuf, "blew on the cake to light the candles.\n"); + my_strcat(inbuf, "This program, bzip2, the associated library libbzip2, and all\n"); + my_strcat(inbuf, "documentation, are copyright (C) 1996-2004 Julian R Seward. All\n"); + my_strcat(inbuf, "rights reserved.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "Redistribution and use in source and binary forms, with or without\n"); + my_strcat(inbuf, "modification, are permitted provided that the following conditions\n"); + my_strcat(inbuf, "are met:\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "1. Redistributions of source code must retain the above copyright\n"); + my_strcat(inbuf, " notice, this list of conditions and the following disclaimer.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "2. The origin of this software must not be misrepresented; you must\n"); + my_strcat(inbuf, " not claim that you wrote the original software. If you use this\n"); + my_strcat(inbuf, " software in a product, an acknowledgment in the product\n"); + my_strcat(inbuf, " documentation would be appreciated but is not required.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "3. Altered source versions must be plainly marked as such, and must\n"); + my_strcat(inbuf, " not be misrepresented as being the original software.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "4. The name of the author may not be used to endorse or promote\n"); + my_strcat(inbuf, " products derived from this software without specific prior written\n"); + my_strcat(inbuf, " permission.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS\n"); + my_strcat(inbuf, "OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED\n"); + my_strcat(inbuf, "WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE\n"); + my_strcat(inbuf, "ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY\n"); + my_strcat(inbuf, "DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL\n"); + my_strcat(inbuf, "DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE\n"); + my_strcat(inbuf, "GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS\n"); + my_strcat(inbuf, "INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,\n"); + my_strcat(inbuf, "WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING\n"); + my_strcat(inbuf, "NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS\n"); + my_strcat(inbuf, "SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.\n"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, "ababababababababababababababababababababababababababababababab"); + my_strcat(inbuf, " GNU GENERAL PUBLIC LICENSE\n"); + my_strcat(inbuf, " Version 2, June 1991\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " Copyright (C) 1989, 1991 Free Software Foundation, Inc.\n"); + my_strcat(inbuf, " 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA\n"); + my_strcat(inbuf, " Everyone is permitted to copy and distribute verbatim copies\n"); + my_strcat(inbuf, " of this license document, but changing it is not allowed.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " Preamble\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " The licenses for most software are designed to take away your\n"); + my_strcat(inbuf, "freedom to share and change it. By contrast, the GNU General Public\n"); + my_strcat(inbuf, "License is intended to guarantee your freedom to share and change free\n"); + my_strcat(inbuf, "software--to make sure the software is free for all its users. This\n"); + my_strcat(inbuf, "General Public License applies to most of the Free Software\n"); + my_strcat(inbuf, "Foundation's software and to any other program whose authors commit to\n"); + my_strcat(inbuf, "using it. (Some other Free Software Foundation software is covered by\n"); + my_strcat(inbuf, "the GNU Library General Public License instead.) You can apply it to\n"); + my_strcat(inbuf, "your programs, too.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " When we speak of free software, we are referring to freedom, not\n"); + my_strcat(inbuf, "price. Our General Public Licenses are designed to make sure that you\n"); + my_strcat(inbuf, "have the freedom to distribute copies of free software (and charge for\n"); + my_strcat(inbuf, "this service if you wish), that you receive source code or can get it\n"); + my_strcat(inbuf, "if you want it, that you can change the software or use pieces of it\n"); + my_strcat(inbuf, "in new free programs; and that you know you can do these things.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " To protect your rights, we need to make restrictions that forbid\n"); + my_strcat(inbuf, "anyone to deny you these rights or to ask you to surrender the rights.\n"); + my_strcat(inbuf, "These restrictions translate to certain responsibilities for you if you\n"); + my_strcat(inbuf, "distribute copies of the software, or if you modify it.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " For example, if you distribute copies of such a program, whether\n"); + my_strcat(inbuf, "gratis or for a fee, you must give the recipients all the rights that\n"); + my_strcat(inbuf, "you have. You must make sure that they, too, receive or can get the\n"); + my_strcat(inbuf, "source code. And you must show them these terms so they know their\n"); + my_strcat(inbuf, "rights.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " We protect your rights with two steps: (1) copyright the software, and\n"); + my_strcat(inbuf, "(2) offer you this license which gives you legal permission to copy,\n"); + my_strcat(inbuf, "distribute and/or modify the software.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " Also, for each author's protection and ours, we want to make certain\n"); + my_strcat(inbuf, "that everyone understands that there is no warranty for this free\n"); + my_strcat(inbuf, "software. If the software is modified by someone else and passed on, we\n"); + my_strcat(inbuf, "want its recipients to know that what they have is not the original, so\n"); + my_strcat(inbuf, "that any problems introduced by others will not reflect on the original\n"); + my_strcat(inbuf, "authors' reputations.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " Finally, any free program is threatened constantly by software\n"); + my_strcat(inbuf, "patents. We wish to avoid the danger that redistributors of a free\n"); + my_strcat(inbuf, "program will individually obtain patent licenses, in effect making the\n"); + my_strcat(inbuf, "program proprietary. To prevent this, we have made it clear that any\n"); + my_strcat(inbuf, "patent must be licensed for everyone's free use or not licensed at all.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " The precise terms and conditions for copying, distribution and\n"); + my_strcat(inbuf, "modification follow.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " GNU GENERAL PUBLIC LICENSE\n"); + my_strcat(inbuf, " TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 0. This License applies to any program or other work which contains\n"); + my_strcat(inbuf, "a notice placed by the copyright holder saying it may be distributed\n"); + my_strcat(inbuf, "under the terms of this General Public License. The Program, below,\n"); + my_strcat(inbuf, "refers to any such program or work, and a work based on the Program\n"); + my_strcat(inbuf, "means either the Program or any derivative work under copyright law:\n"); + my_strcat(inbuf, "that is to say, a work containing the Program or a portion of it,\n"); + my_strcat(inbuf, "either verbatim or with modifications and/or translated into another\n"); + my_strcat(inbuf, "language. (Hereinafter, translation is included without limitation in\n"); + my_strcat(inbuf, "the term modification.) Each licensee is addressed as you.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "Activities other than copying, distribution and modification are not\n"); + my_strcat(inbuf, "covered by this License; they are outside its scope. The act of\n"); + my_strcat(inbuf, "running the Program is not restricted, and the output from the Program\n"); + my_strcat(inbuf, "is covered only if its contents constitute a work based on the\n"); + my_strcat(inbuf, "Program (independent of having been made by running the Program).\n"); + my_strcat(inbuf, "Whether that is true depends on what the Program does.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 1. You may copy and distribute verbatim copies of the Program's\n"); + my_strcat(inbuf, "source code as you receive it, in any medium, provided that you\n"); + my_strcat(inbuf, "conspicuously and appropriately publish on each copy an appropriate\n"); + my_strcat(inbuf, "copyright notice and disclaimer of warranty; keep intact all the\n"); + my_strcat(inbuf, "notices that refer to this License and to the absence of any warranty;\n"); + my_strcat(inbuf, "and give any other recipients of the Program a copy of this License\n"); + my_strcat(inbuf, "along with the Program.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "You may charge a fee for the physical act of transferring a copy, and\n"); + my_strcat(inbuf, "you may at your option offer warranty protection in exchange for a fee.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 2. You may modify your copy or copies of the Program or any portion\n"); + my_strcat(inbuf, "of it, thus forming a work based on the Program, and copy and\n"); + my_strcat(inbuf, "distribute such modifications or work under the terms of Section 1\n"); + my_strcat(inbuf, "above, provided that you also meet all of these conditions:\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " a) You must cause the modified files to carry prominent notices\n"); + my_strcat(inbuf, " stating that you changed the files and the date of any change.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " b) You must cause any work that you distribute or publish, that in\n"); + my_strcat(inbuf, " whole or in part contains or is derived from the Program or any\n"); + my_strcat(inbuf, " part thereof, to be licensed as a whole at no charge to all third\n"); + my_strcat(inbuf, " parties under the terms of this License.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " c) If the modified program normally reads commands interactively\n"); + my_strcat(inbuf, " when run, you must cause it, when started running for such\n"); + my_strcat(inbuf, " interactive use in the most ordinary way, to print or display an\n"); + my_strcat(inbuf, " announcement including an appropriate copyright notice and a\n"); + my_strcat(inbuf, " notice that there is no warranty (or else, saying that you provide\n"); + my_strcat(inbuf, " a warranty) and that users may redistribute the program under\n"); + my_strcat(inbuf, " these conditions, and telling the user how to view a copy of this\n"); + my_strcat(inbuf, " License. (Exception: if the Program itself is interactive but\n"); + my_strcat(inbuf, " does not normally print such an announcement, your work based on\n"); + my_strcat(inbuf, " the Program is not required to print an announcement.)\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "These requirements apply to the modified work as a whole. If\n"); + my_strcat(inbuf, "identifiable sections of that work are not derived from the Program,\n"); + my_strcat(inbuf, "and can be reasonably considered independent and separate works in\n"); + my_strcat(inbuf, "themselves, then this License, and its terms, do not apply to those\n"); + my_strcat(inbuf, "sections when you distribute them as separate works. But when you\n"); + my_strcat(inbuf, "distribute the same sections as part of a whole which is a work based\n"); + my_strcat(inbuf, "on the Program, the distribution of the whole must be on the terms of\n"); + my_strcat(inbuf, "this License, whose permissions for other licensees extend to the\n"); + my_strcat(inbuf, "entire whole, and thus to each and every part regardless of who wrote it.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "Thus, it is not the intent of this section to claim rights or contest\n"); + my_strcat(inbuf, "your rights to work written entirely by you; rather, the intent is to\n"); + my_strcat(inbuf, "exercise the right to control the distribution of derivative or\n"); + my_strcat(inbuf, "collective works based on the Program.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "In addition, mere aggregation of another work not based on the Program\n"); + my_strcat(inbuf, "with the Program (or with a work based on the Program) on a volume of\n"); + my_strcat(inbuf, "a storage or distribution medium does not bring the other work under\n"); + my_strcat(inbuf, "the scope of this License.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 3. You may copy and distribute the Program (or a work based on it,\n"); + my_strcat(inbuf, "under Section 2) in object code or executable form under the terms of\n"); + my_strcat(inbuf, "Sections 1 and 2 above provided that you also do one of the following:\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " a) Accompany it with the complete corresponding machine-readable\n"); + my_strcat(inbuf, " source code, which must be distributed under the terms of Sections\n"); + my_strcat(inbuf, " 1 and 2 above on a medium customarily used for software interchange; or,\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " b) Accompany it with a written offer, valid for at least three\n"); + my_strcat(inbuf, " years, to give any third party, for a charge no more than your\n"); + my_strcat(inbuf, " cost of physically performing source distribution, a complete\n"); + my_strcat(inbuf, " machine-readable copy of the corresponding source code, to be\n"); + my_strcat(inbuf, " distributed under the terms of Sections 1 and 2 above on a medium\n"); + my_strcat(inbuf, " customarily used for software interchange; or,\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " c) Accompany it with the information you received as to the offer\n"); + my_strcat(inbuf, " to distribute corresponding source code. (This alternative is\n"); + my_strcat(inbuf, " allowed only for noncommercial distribution and only if you\n"); + my_strcat(inbuf, " received the program in object code or executable form with such\n"); + my_strcat(inbuf, " an offer, in accord with Subsection b above.)\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "The source code for a work means the preferred form of the work for\n"); + my_strcat(inbuf, "making modifications to it. For an executable work, complete source\n"); + my_strcat(inbuf, "code means all the source code for all modules it contains, plus any\n"); + my_strcat(inbuf, "associated interface definition files, plus the scripts used to\n"); + my_strcat(inbuf, "control compilation and installation of the executable. However, as a\n"); + my_strcat(inbuf, "special exception, the source code distributed need not include\n"); + my_strcat(inbuf, "anything that is normally distributed (in either source or binary\n"); + my_strcat(inbuf, "form) with the major components (compiler, kernel, and so on) of the\n"); + my_strcat(inbuf, "operating system on which the executable runs, unless that component\n"); + my_strcat(inbuf, "itself accompanies the executable.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "If distribution of executable or object code is made by offering\n"); + my_strcat(inbuf, "access to copy from a designated place, then offering equivalent\n"); + my_strcat(inbuf, "access to copy the source code from the same place counts as\n"); + my_strcat(inbuf, "distribution of the source code, even though third parties are not\n"); + my_strcat(inbuf, "compelled to copy the source along with the object code.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 4. You may not copy, modify, sublicense, or distribute the Program\n"); + my_strcat(inbuf, "except as expressly provided under this License. Any attempt\n"); + my_strcat(inbuf, "otherwise to copy, modify, sublicense or distribute the Program is\n"); + my_strcat(inbuf, "void, and will automatically terminate your rights under this License.\n"); + my_strcat(inbuf, "However, parties who have received copies, or rights, from you under\n"); + my_strcat(inbuf, "this License will not have their licenses terminated so long as such\n"); + my_strcat(inbuf, "parties remain in full compliance.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 5. You are not required to accept this License, since you have not\n"); + my_strcat(inbuf, "signed it. However, nothing else grants you permission to modify or\n"); + my_strcat(inbuf, "distribute the Program or its derivative works. These actions are\n"); + my_strcat(inbuf, "prohibited by law if you do not accept this License. Therefore, by\n"); + my_strcat(inbuf, "modifying or distributing the Program (or any work based on the\n"); + my_strcat(inbuf, "Program), you indicate your acceptance of this License to do so, and\n"); + my_strcat(inbuf, "all its terms and conditions for copying, distributing or modifying\n"); + my_strcat(inbuf, "the Program or works based on it.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 6. Each time you redistribute the Program (or any work based on the\n"); + my_strcat(inbuf, "Program), the recipient automatically receives a license from the\n"); + my_strcat(inbuf, "original licensor to copy, distribute or modify the Program subject to\n"); + my_strcat(inbuf, "these terms and conditions. You may not impose any further\n"); + my_strcat(inbuf, "restrictions on the recipients' exercise of the rights granted herein.\n"); + my_strcat(inbuf, "You are not responsible for enforcing compliance by third parties to\n"); + my_strcat(inbuf, "this License.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 7. If, as a consequence of a court judgment or allegation of patent\n"); + my_strcat(inbuf, "infringement or for any other reason (not limited to patent issues),\n"); + my_strcat(inbuf, "conditions are imposed on you (whether by court order, agreement or\n"); + my_strcat(inbuf, "otherwise) that contradict the conditions of this License, they do not\n"); + my_strcat(inbuf, "excuse you from the conditions of this License. If you cannot\n"); + my_strcat(inbuf, "distribute so as to satisfy simultaneously your obligations under this\n"); + my_strcat(inbuf, "License and any other pertinent obligations, then as a consequence you\n"); + my_strcat(inbuf, "may not distribute the Program at all. For example, if a patent\n"); + my_strcat(inbuf, "license would not permit royalty-free redistribution of the Program by\n"); + my_strcat(inbuf, "all those who receive copies directly or indirectly through you, then\n"); + my_strcat(inbuf, "the only way you could satisfy both it and this License would be to\n"); + my_strcat(inbuf, "refrain entirely from distribution of the Program.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "If any portion of this section is held invalid or unenforceable under\n"); + my_strcat(inbuf, "any particular circumstance, the balance of the section is intended to\n"); + my_strcat(inbuf, "apply and the section as a whole is intended to apply in other\n"); + my_strcat(inbuf, "circumstances.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "It is not the purpose of this section to induce you to infringe any\n"); + my_strcat(inbuf, "patents or other property right claims or to contest validity of any\n"); + my_strcat(inbuf, "such claims; this section has the sole purpose of protecting the\n"); + my_strcat(inbuf, "integrity of the free software distribution system, which is\n"); + my_strcat(inbuf, "implemented by public license practices. Many people have made\n"); + my_strcat(inbuf, "generous contributions to the wide range of software distributed\n"); + my_strcat(inbuf, "through that system in reliance on consistent application of that\n"); + my_strcat(inbuf, "system; it is up to the author/donor to decide if he or she is willing\n"); + my_strcat(inbuf, "to distribute software through any other system and a licensee cannot\n"); + my_strcat(inbuf, "impose that choice.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "This section is intended to make thoroughly clear what is believed to\n"); + my_strcat(inbuf, "be a consequence of the rest of this License.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 8. If the distribution and/or use of the Program is restricted in\n"); + my_strcat(inbuf, "certain countries either by patents or by copyrighted interfaces, the\n"); + my_strcat(inbuf, "original copyright holder who places the Program under this License\n"); + my_strcat(inbuf, "may add an explicit geographical distribution limitation excluding\n"); + my_strcat(inbuf, "those countries, so that distribution is permitted only in or among\n"); + my_strcat(inbuf, "countries not thus excluded. In such case, this License incorporates\n"); + my_strcat(inbuf, "the limitation as if written in the body of this License.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 9. The Free Software Foundation may publish revised and/or new versions\n"); + my_strcat(inbuf, "of the General Public License from time to time. Such new versions will\n"); + my_strcat(inbuf, "be similar in spirit to the present version, but may differ in detail to\n"); + my_strcat(inbuf, "address new problems or concerns.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "Each version is given a distinguishing version number. If the Program\n"); + my_strcat(inbuf, "specifies a version number of this License which applies to it and any\n"); + my_strcat(inbuf, "later version, you have the option of following the terms and conditions\n"); + my_strcat(inbuf, "either of that version or of any later version published by the Free\n"); + my_strcat(inbuf, "Software Foundation. If the Program does not specify a version number of\n"); + my_strcat(inbuf, "this License, you may choose any version ever published by the Free Software\n"); + my_strcat(inbuf, "Foundation.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 10. If you wish to incorporate parts of the Program into other free\n"); + my_strcat(inbuf, "programs whose distribution conditions are different, write to the author\n"); + my_strcat(inbuf, "to ask for permission. For software which is copyrighted by the Free\n"); + my_strcat(inbuf, "Software Foundation, write to the Free Software Foundation; we sometimes\n"); + my_strcat(inbuf, "make exceptions for this. Our decision will be guided by the two goals\n"); + my_strcat(inbuf, "of preserving the free status of all derivatives of our free software and\n"); + my_strcat(inbuf, "of promoting the sharing and reuse of software generally.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " NO WARRANTY\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 11. BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY\n"); + my_strcat(inbuf, "FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW. EXCEPT WHEN\n"); + my_strcat(inbuf, "OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES\n"); + my_strcat(inbuf, "PROVIDE THE PROGRAM AS IS WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED\n"); + my_strcat(inbuf, "OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF\n"); + my_strcat(inbuf, "MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS\n"); + my_strcat(inbuf, "TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU. SHOULD THE\n"); + my_strcat(inbuf, "PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING,\n"); + my_strcat(inbuf, "REPAIR OR CORRECTION.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " 12. IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING\n"); + my_strcat(inbuf, "WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR\n"); + my_strcat(inbuf, "REDISTRIBUTE THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES,\n"); + my_strcat(inbuf, "INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING\n"); + my_strcat(inbuf, "OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED\n"); + my_strcat(inbuf, "TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY\n"); + my_strcat(inbuf, "YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER\n"); + my_strcat(inbuf, "PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE\n"); + my_strcat(inbuf, "POSSIBILITY OF SUCH DAMAGES.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " END OF TERMS AND CONDITIONS\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " How to Apply These Terms to Your New Programs\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " If you develop a new program, and you want it to be of the greatest\n"); + my_strcat(inbuf, "possible use to the public, the best way to achieve this is to make it\n"); + my_strcat(inbuf, "free software which everyone can redistribute and change under these terms.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " To do so, attach the following notices to the program. It is safest\n"); + my_strcat(inbuf, "to attach them to the start of each source file to most effectively\n"); + my_strcat(inbuf, "convey the exclusion of warranty; and each file should have at least\n"); + my_strcat(inbuf, "the copyright line and a pointer to where the full notice is found.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " <one line to give the program's name and a brief idea of what it does.>\n"); + my_strcat(inbuf, " Copyright (C) <year> <name of author>\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " This program is free software; you can redistribute it and/or modify\n"); + my_strcat(inbuf, " it under the terms of the GNU General Public License as published by\n"); + my_strcat(inbuf, " the Free Software Foundation; either version 2 of the License, or\n"); + my_strcat(inbuf, " (at your option) any later version.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " This program is distributed in the hope that it will be useful,\n"); + my_strcat(inbuf, " but WITHOUT ANY WARRANTY; without even the implied warranty of\n"); + my_strcat(inbuf, " MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the\n"); + my_strcat(inbuf, " GNU General Public License for more details.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " You should have received a copy of the GNU General Public License\n"); + my_strcat(inbuf, " along with this program; if not, write to the Free Software\n"); + my_strcat(inbuf, " Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "Also add information on how to contact you by electronic and paper mail.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "If the program is interactive, make it output a short notice like this\n"); + my_strcat(inbuf, "when it starts in an interactive mode:\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " Gnomovision version 69, Copyright (C) year name of author\n"); + my_strcat(inbuf, " Gnomovision comes with ABSOLUTELY NO WARRANTY; for details type `show w'.\n"); + my_strcat(inbuf, " This is free software, and you are welcome to redistribute it\n"); + my_strcat(inbuf, " under certain conditions; type `show c' for details.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "The hypothetical commands `show w' and `show c' should show the appropriate\n"); + my_strcat(inbuf, "parts of the General Public License. Of course, the commands you use may\n"); + my_strcat(inbuf, "be called something other than `show w' and `show c'; they could even be\n"); + my_strcat(inbuf, "mouse-clicks or menu items--whatever suits your program.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "You should also get your employer (if you work as a programmer) or your\n"); + my_strcat(inbuf, "school, if any, to sign a copyright disclaimer for the program, if\n"); + my_strcat(inbuf, "necessary. Here is a sample; alter the names:\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " Yoyodyne, Inc., hereby disclaims all copyright interest in the program\n"); + my_strcat(inbuf, " `Gnomovision' (which makes passes at compilers) written by James Hacker.\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, " <signature of Ty Coon>, 1 April 1989\n"); + my_strcat(inbuf, " Ty Coon, President of Vice\n"); + my_strcat(inbuf, "\n"); + my_strcat(inbuf, "This General Public License does not permit incorporating your program into\n"); + my_strcat(inbuf, "proprietary programs. If your program is a subroutine library, you may\n"); + my_strcat(inbuf, "consider it more useful to permit linking proprietary applications with the\n"); + my_strcat(inbuf, "library. If this is what you want to do, use the GNU Library General\n"); + my_strcat(inbuf, "Public License instead of this License.\n"); + + my_strcat(inbuf, "\n"); +} + +#include <stdio.h> +#include <assert.h> + +/* For providing services. */ +static HWord g_serviceFn ( HWord arg1, HWord arg2 ) +{ + switch (arg1) { + case 0: /* EXIT */ + exit(0); + case 1: /* PUTC */ + putchar(arg2); + return 0; + case 2: /* MALLOC */ + return (HWord)malloc(arg2); + case 3: /* FREE */ + free((void*)arg2); + return 0; + default: + assert(0); + } +} + +static char *bzerrorstrings[] = { + "OK" + ,"SEQUENCE_ERROR" + ,"PARAM_ERROR" + ,"MEM_ERROR" + ,"DATA_ERROR" + ,"DATA_ERROR_MAGIC" + ,"IO_ERROR" + ,"UNEXPECTED_EOF" + ,"OUTBUFF_FULL" + ,"CONFIG_ERROR" + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ + ,"???" /* for future */ +}; + +// If given a cmd line arg, behave as a correctness regtest +// (run fast and be verbose). If not, run for a long time +// which is what is needed for the performance suite. +int main ( int argc, char** argv ) +{ + int r; + int bit; + int i; + + int regtest; + assert(argc == 1 || argc == 2); + regtest = argc==2; + regtest = 1; + serviceFn = g_serviceFn; + + set_inbuf(); + nIn = vex_strlen(inbuf)+1; + vex_printf( "%d bytes read\n", nIn ); + + nZ = M_BLOCK; + r = BZ2_bzBuffToBuffCompress ( + zbuf, &nZ, inbuf, nIn, 9, 3/*verb*/, 30 ); + + if (r != BZ_OK) { + vex_printf("initial compress failed!\n"); + (*serviceFn)(0,0); + } + vex_printf( "%d after compression\n", nZ ); + + for (bit = 0; bit < nZ*8; bit += (bit < 35 ? 1 : (regtest?2377:137))) { + if (regtest) + vex_printf( "bit %d ", bit ); + flip_bit ( bit ); + nOut = M_BLOCK_OUT; + r = BZ2_bzBuffToBuffDecompress ( + outbuf, &nOut, zbuf, nZ, 1/*small*/, 0 ); + if (regtest) + vex_printf( " %d %s ", r, bzerrorstrings[-r] ); + + if (r != BZ_OK) { + if (regtest) + vex_printf( "\n" ); + } else { + if (nOut != nIn) { + vex_printf( "nIn/nOut mismatch %d %d\n", nIn, nOut ); + (*serviceFn)(0,0); + } else { + for (i = 0; i < nOut; i++) + if (inbuf[i] != outbuf[i]) { + vex_printf( "mismatch at %d\n", i ); + (*serviceFn)(0,0); + } + if (i == nOut) vex_printf( "really ok!\n" ); + } + } + + flip_bit ( bit ); + } + +#if 0 + assert (nOut == nIn); + for (i = 0; i < nOut; i++) { + if (inbuf[i] != outbuf[i]) { + vex_printf( "difference at %d !\n", i ); + return 1; + } + } +#endif + + vex_printf( "all ok\n" ); + (*serviceFn)(0,0); + /*NOTREACHED*/ + return 0; +} diff --git a/exp-sgcheck/tests/hackedbz2.stderr.exp-glibc28-amd64 b/exp-sgcheck/tests/hackedbz2.stderr.exp-glibc28-amd64 new file mode 100644 index 00000000..43c3c0da --- /dev/null +++ b/exp-sgcheck/tests/hackedbz2.stderr.exp-glibc28-amd64 @@ -0,0 +1,16 @@ + +Invalid read of size 1 + at 0x........: vex_strlen (hackedbz2.c:1006) + by 0x........: add_to_myprintf_buf (hackedbz2.c:1284) + by 0x........: vex_printf (hackedbz2.c:1155) + by 0x........: BZ2_compressBlock (hackedbz2.c:4039) + by 0x........: handle_compress (hackedbz2.c:4761) + by 0x........: BZ2_bzCompress (hackedbz2.c:4831) + by 0x........: BZ2_bzBuffToBuffCompress (hackedbz2.c:5638) + by 0x........: main (hackedbz2.c:6484) + Address 0x........ expected vs actual: + Expected: global array "myprintf_buf" in object with soname "NONE" + Actual: unknown + + +ERROR SUMMARY: 1 errors from 1 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/hackedbz2.stdout.exp b/exp-sgcheck/tests/hackedbz2.stdout.exp new file mode 100644 index 00000000..3bfc54ec --- /dev/null +++ b/exp-sgcheck/tests/hackedbz2.stdout.exp @@ -0,0 +1,70 @@ +22323 bytes read + block 1: crc = 0xA212ABF8, combined CRC = 0xA212ABF8, size = 22373 + too repetitive; using fallback sorting algorithm + 22373 in block, 13504 after MTF & 1-2 coding, 79+2 syms in use + pass 1: size is 17143, grp uses are 38 62 2 92 6 71 + pass 2: size is 6506, grp uses are 28 71 0 86 9 77 + pass 3: size is 6479, grp uses are 26 70 0 81 11 83 + pass 4: size is 6469, grp uses are 26 69 0 74 17 85 + bytes: mapping 19, selectors 66, code lengths 134, codes 6465 + final combined CRC = 0xA212ABF8 + 6710 after compression +bit 0 -5 DATA_ERROR_MAGIC +bit 1 -5 DATA_ERROR_MAGIC +bit 2 -5 DATA_ERROR_MAGIC +bit 3 -5 DATA_ERROR_MAGIC +bit 4 -5 DATA_ERROR_MAGIC +bit 5 -5 DATA_ERROR_MAGIC +bit 6 -5 DATA_ERROR_MAGIC +bit 7 -5 DATA_ERROR_MAGIC +bit 8 -5 DATA_ERROR_MAGIC +bit 9 -5 DATA_ERROR_MAGIC +bit 10 -5 DATA_ERROR_MAGIC +bit 11 -5 DATA_ERROR_MAGIC +bit 12 -5 DATA_ERROR_MAGIC +bit 13 -5 DATA_ERROR_MAGIC +bit 14 -5 DATA_ERROR_MAGIC +bit 15 -5 DATA_ERROR_MAGIC +bit 16 -5 DATA_ERROR_MAGIC +bit 17 -5 DATA_ERROR_MAGIC +bit 18 -5 DATA_ERROR_MAGIC +bit 19 -5 DATA_ERROR_MAGIC +bit 20 -5 DATA_ERROR_MAGIC +bit 21 -5 DATA_ERROR_MAGIC +bit 22 -5 DATA_ERROR_MAGIC +bit 23 -5 DATA_ERROR_MAGIC +bit 24 0 OK really ok! +bit 25 -5 DATA_ERROR_MAGIC +bit 26 -5 DATA_ERROR_MAGIC +bit 27 0 OK really ok! +bit 28 -5 DATA_ERROR_MAGIC +bit 29 -5 DATA_ERROR_MAGIC +bit 30 -5 DATA_ERROR_MAGIC +bit 31 -5 DATA_ERROR_MAGIC +bit 32 -4 DATA_ERROR +bit 33 -4 DATA_ERROR +bit 34 -4 DATA_ERROR +bit 35 -4 DATA_ERROR +bit 2412 -4 DATA_ERROR +bit 4789 -4 DATA_ERROR +bit 7166 -4 DATA_ERROR +bit 9543 -4 DATA_ERROR +bit 11920 -4 DATA_ERROR +bit 14297 -4 DATA_ERROR +bit 16674 -4 DATA_ERROR +bit 19051 -4 DATA_ERROR +bit 21428 -4 DATA_ERROR +bit 23805 -4 DATA_ERROR +bit 26182 -4 DATA_ERROR +bit 28559 -4 DATA_ERROR +bit 30936 -4 DATA_ERROR +bit 33313 -4 DATA_ERROR +bit 35690 -4 DATA_ERROR +bit 38067 -4 DATA_ERROR +bit 40444 -4 DATA_ERROR +bit 42821 -4 DATA_ERROR +bit 45198 -4 DATA_ERROR +bit 47575 -4 DATA_ERROR +bit 49952 -4 DATA_ERROR +bit 52329 -4 DATA_ERROR +all ok diff --git a/exp-sgcheck/tests/hackedbz2.vgtest b/exp-sgcheck/tests/hackedbz2.vgtest new file mode 100644 index 00000000..ea8f5e8c --- /dev/null +++ b/exp-sgcheck/tests/hackedbz2.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: hackedbz2 diff --git a/exp-sgcheck/tests/hp_bounds.c b/exp-sgcheck/tests/hp_bounds.c new file mode 100644 index 00000000..e456cabe --- /dev/null +++ b/exp-sgcheck/tests/hp_bounds.c @@ -0,0 +1,13 @@ +#include <stdlib.h> + +int main(void) +{ + int y __attribute__((unused)); + int* x = malloc(sizeof(int) * 100); + + y = x[95]; // ok + y = x[100]; // overrun + y = x[-1]; // underrun + + return 0; +} diff --git a/exp-sgcheck/tests/hp_bounds.stderr.exp b/exp-sgcheck/tests/hp_bounds.stderr.exp new file mode 100644 index 00000000..28121b82 --- /dev/null +++ b/exp-sgcheck/tests/hp_bounds.stderr.exp @@ -0,0 +1,17 @@ + +Invalid read of size 4 + at 0x........: main (hp_bounds.c:9) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (hp_bounds.c:6) + +Invalid read of size 4 + at 0x........: main (hp_bounds.c:10) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (hp_bounds.c:6) + + +ERROR SUMMARY: 2 errors from 2 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/hp_bounds.vgtest b/exp-sgcheck/tests/hp_bounds.vgtest new file mode 100644 index 00000000..96a983e5 --- /dev/null +++ b/exp-sgcheck/tests/hp_bounds.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: hp_bounds diff --git a/exp-sgcheck/tests/hp_dangle.c b/exp-sgcheck/tests/hp_dangle.c new file mode 100644 index 00000000..31470df4 --- /dev/null +++ b/exp-sgcheck/tests/hp_dangle.c @@ -0,0 +1,21 @@ + +#include <stdlib.h> + +int* mk_dangle(void) +{ + int* x = malloc(400); + free(x); + + return x; +} + +int main(void) +{ + int y __attribute__((unused)); + int* x = mk_dangle(); + + y = x[5]; + y = x[-1]; + + return 0; +} diff --git a/exp-sgcheck/tests/hp_dangle.stderr.exp b/exp-sgcheck/tests/hp_dangle.stderr.exp new file mode 100644 index 00000000..21420276 --- /dev/null +++ b/exp-sgcheck/tests/hp_dangle.stderr.exp @@ -0,0 +1,19 @@ + +Invalid read of size 4 + at 0x........: main (hp_dangle.c:17) + Address 0x........ is 20 bytes inside the accessing pointer's + once-legitimate range, a block of size 400 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: mk_dangle (hp_dangle.c:7) + by 0x........: main (hp_dangle.c:15) + +Doubly-invalid read of size 4 + at 0x........: main (hp_dangle.c:18) + Address 0x........ is 4 bytes before the accessing pointer's + once-legitimate range, a block of size 400 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: mk_dangle (hp_dangle.c:7) + by 0x........: main (hp_dangle.c:15) + + +ERROR SUMMARY: 2 errors from 2 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/hp_dangle.vgtest b/exp-sgcheck/tests/hp_dangle.vgtest new file mode 100644 index 00000000..42cbe6c5 --- /dev/null +++ b/exp-sgcheck/tests/hp_dangle.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: hp_dangle diff --git a/exp-sgcheck/tests/hsg.c b/exp-sgcheck/tests/hsg.c new file mode 100644 index 00000000..7f497b46 --- /dev/null +++ b/exp-sgcheck/tests/hsg.c @@ -0,0 +1,48 @@ + +/* A simple test to demonstrate heap, stack, and global overrun + detection. */ + +#include <stdio.h> +#include <stdlib.h> + +short ga[100]; + +__attribute__((noinline)) +int addup_wrongly ( short* arr ) +{ + int sum = 0, i; + for (i = 0; i <= 100; i++) + sum += (int)arr[i]; + return sum; +} + +__attribute__((noinline)) +int do_other_stuff ( void ) +{ + short la[100]; + return 123 + addup_wrongly(la); +} + +__attribute__((noinline)) +int do_stupid_malloc_stuff ( void ) +{ + int sum = 0; + unsigned char* duh = malloc(100 * sizeof(char)); + sum += duh[-1]; + free(duh); + sum += duh[50]; + return sum; +} + +int main ( void ) +{ + long s = addup_wrongly(ga); + s += do_other_stuff(); + s += do_stupid_malloc_stuff(); + if (s == 123456789) { + fprintf(stdout, "well, i never!\n"); + } else { + fprintf(stdout, "boringly as expected\n"); + } + return 0; +} diff --git a/exp-sgcheck/tests/hsg.stderr.exp b/exp-sgcheck/tests/hsg.stderr.exp new file mode 100644 index 00000000..acbc5a9c --- /dev/null +++ b/exp-sgcheck/tests/hsg.stderr.exp @@ -0,0 +1,230 @@ +<?xml version="1.0"?> + +<valgrindoutput> + +<protocolversion>4</protocolversion> +<protocoltool>exp-ptrcheck</protocoltool> + +<preamble> + <line>...</line> + <line>...</line> + <line>...</line> + <line>...</line> + <line>...</line> +</preamble> + +<pid>...</pid> +<ppid>...</ppid> +<tool>exp-ptrcheck</tool> + +<args> + <vargv>...</vargv> + <argv> + <exe>./hsg</exe> + </argv> +</args> + +<status> + <state>RUNNING</state> + <time>...</time> +</status> + +<error> + <unique>0x........</unique> + <tid>...</tid> + <kind>SorG</kind> + <what>Invalid read of size 2</what> + <stack> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>addup_wrongly</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>main</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + </stack> + <auxwhat>Address 0x........ expected vs actual:</auxwhat> + <auxwhat>Expected: global array "ga" in object with soname "NONE"</auxwhat> + <auxwhat>Actual: unknown</auxwhat> +</error> + +<error> + <unique>0x........</unique> + <tid>...</tid> + <kind>SorG</kind> + <what>Invalid read of size 2</what> + <stack> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>addup_wrongly</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>do_other_stuff</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>main</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + </stack> + <auxwhat>Address 0x........ expected vs actual:</auxwhat> + <auxwhat>Expected: stack array "la" in frame 1 back from here</auxwhat> + <auxwhat>Actual: unknown</auxwhat> +</error> + +<error> + <unique>0x........</unique> + <tid>...</tid> + <kind>Heap</kind> + <what>Invalid read of size 1</what> + <stack> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>do_stupid_malloc_stuff</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>main</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + </stack> + <auxwhat>Address 0x........ is 1 bytes before the accessing pointer's</auxwhat> + <auxwhat>legitimate range, a block of size 100 alloc'd</auxwhat> + <stack> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>malloc</fn> + <dir>...</dir> + <file>vg_replace_malloc.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>do_stupid_malloc_stuff</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>main</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + </stack> +</error> + +<error> + <unique>0x........</unique> + <tid>...</tid> + <kind>Heap</kind> + <what>Invalid read of size 1</what> + <stack> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>do_stupid_malloc_stuff</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>main</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + </stack> + <auxwhat>Address 0x........ is 50 bytes inside the accessing pointer's</auxwhat> + <auxwhat>once-legitimate range, a block of size 100 free'd</auxwhat> + <stack> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>free</fn> + <dir>...</dir> + <file>vg_replace_malloc.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>do_stupid_malloc_stuff</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + <frame> + <ip>0x........</ip> + <obj>...</obj> + <fn>main</fn> + <dir>...</dir> + <file>hsg.c</file> + <line>...</line> + </frame> + </stack> +</error> + + +<status> + <state>FINISHED</state> + <time>...</time> +</status> + +<errorcounts> + <pair> + <count>...</count> + <unique>0x........</unique> + </pair> + <pair> + <count>...</count> + <unique>0x........</unique> + </pair> + <pair> + <count>...</count> + <unique>0x........</unique> + </pair> + <pair> + <count>...</count> + <unique>0x........</unique> + </pair> +</errorcounts> + +<suppcounts>...</suppcounts> + +</valgrindoutput> + diff --git a/exp-sgcheck/tests/hsg.stdout.exp b/exp-sgcheck/tests/hsg.stdout.exp new file mode 100644 index 00000000..e5b8e6d6 --- /dev/null +++ b/exp-sgcheck/tests/hsg.stdout.exp @@ -0,0 +1 @@ +boringly as expected diff --git a/exp-sgcheck/tests/hsg.vgtest b/exp-sgcheck/tests/hsg.vgtest new file mode 100644 index 00000000..b6f65366 --- /dev/null +++ b/exp-sgcheck/tests/hsg.vgtest @@ -0,0 +1,4 @@ +prereq: ./is_arch_supported +prog: hsg +vgopts: --xml=yes --xml-fd=2 --log-file=/dev/null +stderr_filter: ../../memcheck/tests/filter_xml diff --git a/exp-sgcheck/tests/idiv.c b/exp-sgcheck/tests/idiv.c new file mode 100644 index 00000000..f4ecb9c2 --- /dev/null +++ b/exp-sgcheck/tests/idiv.c @@ -0,0 +1,40 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // ADD ========================================================= + g(/, n, n2, n); // det, det + + g(/, n, p, e); // detected bad idiv; det, det + + g(/, p, n2, n); // ok, det + + g(/, p, p, e); // detected bad idiv; det, det + + g(/, n, un, n); // undet, undet + g(/, n, up, n); // undetected bad idiv; ok, undet + + g(/, un, n2, n); // undet, undet + g(/, up, n2, n); // ok, undet + + g(/, un, un, n); // undet, undet + g(/, un, up, n); // undetected bad idiv; undet, undet + g(/, up, un, n); // undet, undet + g(/, up, up, n); // undetected bad idiv; undet, undet + + g(/, un, p, n); // detected bad idiv; undet, undet + g(/, up, p, n); // detected bad idiv; undet, undet + + g(/, p, un, n); // undet, undet + g(/, p, up, n); // undetected bad idiv; undet, undet + + return 0; +} diff --git a/exp-sgcheck/tests/idiv.stderr.exp b/exp-sgcheck/tests/idiv.stderr.exp new file mode 100644 index 00000000..92e93911 --- /dev/null +++ b/exp-sgcheck/tests/idiv.stderr.exp @@ -0,0 +1,270 @@ + +about to do 14 [0] +Invalid read of size 4 + at 0x........: main (idiv.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 14 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + +Invalid IDIV + at 0x........: main (idiv.c:16) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First arg not a pointer +Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +about to do 16 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:16) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 16 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:16) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 18 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:18) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 18 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:18) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + +Invalid IDIV + at 0x........: main (idiv.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +about to do 20 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 20 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 22 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 22 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 23 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:23) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 23 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:23) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 25 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:25) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 25 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:25) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 26 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:26) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 26 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:26) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 28 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:28) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 28 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:28) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 29 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:29) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 29 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:29) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 30 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:30) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 30 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:30) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 31 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:31) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 31 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:31) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + +Invalid IDIV + at 0x........: main (idiv.c:33) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First arg may be a pointer +Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +about to do 33 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:33) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 33 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:33) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + +Invalid IDIV + at 0x........: main (idiv.c:34) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First arg may be a pointer +Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +about to do 34 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:34) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 34 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:34) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 36 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:36) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 36 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:36) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 37 [0] + +Invalid read of size 4 + at 0x........: main (idiv.c:37) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 37 [-1] + +Invalid read of size 4 + at 0x........: main (idiv.c:37) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + + +ERROR SUMMARY: 36 errors from 36 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/idiv.vgtest-disabled b/exp-sgcheck/tests/idiv.vgtest-disabled new file mode 100644 index 00000000..e8aa9bb2 --- /dev/null +++ b/exp-sgcheck/tests/idiv.vgtest-disabled @@ -0,0 +1,2 @@ +prog: idiv +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/imul.c b/exp-sgcheck/tests/imul.c new file mode 100644 index 00000000..877c00ae --- /dev/null +++ b/exp-sgcheck/tests/imul.c @@ -0,0 +1,40 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // ADD ========================================================= + g(*, n, n, n); // det, det + + g(*, n, p, n); // det, det + + g(*, p, n, n); // ok, det + + g(*, p, p, e); // detected bad mul; det, det + + g(*, n, un, n); // det, det + g(*, n, up, n); // ok, det + + g(*, un, n, n); // det, det + g(*, up, n, n); // ok, det + + g(*, un, un, n); // det, det + g(*, un, up, n); // det, det + g(*, up, un, n); // det, det + g(*, up, up, n); // undetected bad imul; det, det + + g(*, un, p, n); // det, det + g(*, up, p, n); // undetected bad imul; det, det + + g(*, p, un, n); // det, det + g(*, p, up, n); // undetected bad imul; det, det + + return 0; +} diff --git a/exp-sgcheck/tests/imul.stderr.exp b/exp-sgcheck/tests/imul.stderr.exp new file mode 100644 index 00000000..08f553da --- /dev/null +++ b/exp-sgcheck/tests/imul.stderr.exp @@ -0,0 +1,237 @@ + +about to do 14 [0] +Invalid read of size 4 + at 0x........: main (imul.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 14 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 16 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:16) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 16 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:16) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 18 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:18) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 18 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:18) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + +Invalid IMUL + at 0x........: main (imul.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +about to do 20 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 20 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 22 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 22 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 23 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:23) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 23 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:23) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 25 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:25) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 25 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:25) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 26 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:26) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 26 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:26) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 28 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:28) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 28 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:28) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 29 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:29) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 29 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:29) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 30 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:30) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 30 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:30) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 31 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:31) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 31 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:31) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 33 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:33) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 33 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:33) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 34 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:34) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 34 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:34) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 36 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:36) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 36 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:36) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 37 [0] + +Invalid read of size 4 + at 0x........: main (imul.c:37) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 37 [-1] + +Invalid read of size 4 + at 0x........: main (imul.c:37) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + + +ERROR SUMMARY: 33 errors from 33 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/imul.vgtest-disabled b/exp-sgcheck/tests/imul.vgtest-disabled new file mode 100644 index 00000000..c2203640 --- /dev/null +++ b/exp-sgcheck/tests/imul.vgtest-disabled @@ -0,0 +1,2 @@ +prog: imul +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/is_arch_supported b/exp-sgcheck/tests/is_arch_supported new file mode 100755 index 00000000..bdf2e7f8 --- /dev/null +++ b/exp-sgcheck/tests/is_arch_supported @@ -0,0 +1,15 @@ +#!/bin/sh +# +# Not all architectures are supported by exp-ptr. Currently, PowerPC, s390x +# and ARM are not supported and will fail these tests as follows: +# WARNING: exp-ptrcheck on <blah> platforms: stack and global array +# WARNING: checking is not currently supported. Only heap checking is +# WARNING: supported. +# +# So we use this script to prevent these tests from running on unsupported +# architectures. + +case `uname -i` in + ppc*|arm*|s390x) exit 1;; + *) exit 0;; +esac diff --git a/exp-sgcheck/tests/justify.c b/exp-sgcheck/tests/justify.c new file mode 100644 index 00000000..366c78ba --- /dev/null +++ b/exp-sgcheck/tests/justify.c @@ -0,0 +1,23 @@ +#include <stdlib.h> +#include <assert.h> + +// This is an example of an error found by Annelid, but not found by +// Memcheck -- because the wild read goes past the redzones of the pointer's +// block. +// +// Nb: for Memcheck to not spot this, relies on it putting the 2nd block in +// memory after the 1st block. + +int main ( void ) +{ + char c __attribute__((unused)); + char *c0, *c1; + + c0 = malloc(10000); + c1 = malloc(10000); + assert(c0 && c1); + + c = c0[15000]; + + return 0; +} diff --git a/exp-sgcheck/tests/justify.stderr.exp b/exp-sgcheck/tests/justify.stderr.exp new file mode 100644 index 00000000..0aede4bd --- /dev/null +++ b/exp-sgcheck/tests/justify.stderr.exp @@ -0,0 +1,10 @@ + +Invalid read of size 1 + at 0x........: main (justify.c:20) + Address 0x........ is 5000 bytes after the accessing pointer's + legitimate range, a block of size 10000 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (justify.c:16) + + +ERROR SUMMARY: 1 errors from 1 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/justify.vgtest b/exp-sgcheck/tests/justify.vgtest new file mode 100644 index 00000000..3052c7e6 --- /dev/null +++ b/exp-sgcheck/tests/justify.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: justify diff --git a/exp-sgcheck/tests/mm.c b/exp-sgcheck/tests/mm.c new file mode 100644 index 00000000..0d78cf36 --- /dev/null +++ b/exp-sgcheck/tests/mm.c @@ -0,0 +1,59 @@ +#include "tests/sys_mman.h" +#include <unistd.h> +#include "arith_include1.c" + +// For some reason, the stack frame below __GI_write is disappearing. +// Therefore, if I don't want the write errors to be merged, I have to +// ensure they have a different stack trace. I do this by using this +// function. Weird. +void mywrite(char* buf, int len) +{ + write(-1, buf, len); +} + +int main(void) +{ + struct sigaction sigsegv; + + char c __attribute__((unused)); + + // This fails due to a bad fd (at one point I was not handling failing + // mmap() calls, and would have got a seg fault). + char* res1 = mmap(0, 0, PROT_READ, MAP_PRIVATE, -1, 0 ); + + // This succeeds but is meaningless. Important thing is that the size is + // zero, so Annelid should not subtract one from the size when doing any + // range calculations. (It did at one point, giving 0xffffffff, which + // screwed everything up.) + char* res2 = mmap(0, 0, PROT_READ, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0 ); + + // This succeeds and is useful. + char* res3 = mmap(0, getpagesize(), PROT_READ, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0); + + assert(MAP_FAILED == res1); + assert(NULL == res2); + assert(MAP_FAILED != res3 && NULL != res3); + + // Intall SEGV handler + sigsegv.sa_handler = SEGV_handler; + sigsegv.sa_flags = 0; + assert( 0 == sigemptyset( &sigsegv.sa_mask ) ); + assert( 0 == sigaction(SIGSEGV, &sigsegv, NULL) ); + + #define TTT(i) \ + if (__builtin_setjmp(TTT_jmpbuf) == 0) { c = res3[i]; } + + TTT(0); + TTT(-1); + mywrite(res3, 5); + mywrite(res3-1, 5); + + assert( 0 == munmap(res3, getpagesize()) ); + + TTT(0); + TTT(-1); + mywrite(res3, 5); + mywrite(res3-1, 5); + + return 0; +} diff --git a/exp-sgcheck/tests/mm.stderr.exp b/exp-sgcheck/tests/mm.stderr.exp new file mode 100644 index 00000000..83be5a53 --- /dev/null +++ b/exp-sgcheck/tests/mm.stderr.exp @@ -0,0 +1,65 @@ + +Invalid read of size 1 + at 0x........: main (mm.c:47) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, the 4096-byte block mmap'd + at 0x........: __mmap (in /...libc...) +Warning: invalid file descriptor -1 in syscall write() +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: main (mm.c:49) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte is not within a known block +Last byte (0x........) is 3 bytes within a 4096-byte block mmap'd + at 0x........: __mmap (in /...libc...) + +Invalid read of size 1 + at 0x........: main (mm.c:53) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is 0 bytes inside the accessing pointer's + once-legitimate range, the 4096-byte block munmap'd + at 0x........: __munmap (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Doubly-invalid read of size 1 + at 0x........: main (mm.c:54) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is 1 bytes before the accessing pointer's + once-legitimate range, the 4096-byte block munmap'd + at 0x........: __munmap (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) contains unaddressable byte(s) + at 0x........: __libc_write (...libc...) + by 0x........: main (mm.c:55) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is 0 bytes within a 4096-byte block munmap'd + at 0x........: __munmap (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: main (mm.c:56) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte is not within a known block +Last byte (0x........) is 3 bytes within a 4096-byte block munmap'd + at 0x........: __munmap (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + + +ERROR SUMMARY: 6 errors from 6 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/mm.vgtest-disabled b/exp-sgcheck/tests/mm.vgtest-disabled new file mode 100644 index 00000000..ab3d50e9 --- /dev/null +++ b/exp-sgcheck/tests/mm.vgtest-disabled @@ -0,0 +1 @@ +prog: mm diff --git a/exp-sgcheck/tests/neg.c b/exp-sgcheck/tests/neg.c new file mode 100644 index 00000000..5ea77346 --- /dev/null +++ b/exp-sgcheck/tests/neg.c @@ -0,0 +1,25 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // Neg ========================================================= + ui(-, p, n); // bad NEG; ok, det + + ui(-, up, n); // det, det + + ui(-, un, n); // det, det + + ui(-, n, n); // det, det + + ui(-, nn, n); // det, det + + return 0; +} diff --git a/exp-sgcheck/tests/neg.stderr.exp b/exp-sgcheck/tests/neg.stderr.exp new file mode 100644 index 00000000..1a6eea23 --- /dev/null +++ b/exp-sgcheck/tests/neg.stderr.exp @@ -0,0 +1,53 @@ + +about to do 14 [0] +Invalid read of size 4 + at 0x........: main (neg.c:14) + Address 0x........ is not derived from any known block +about to do 14 [-1] + +Invalid read of size 4 + at 0x........: main (neg.c:14) + Address 0x........ is not derived from any known block +about to do 16 [0] + +Invalid read of size 4 + at 0x........: main (neg.c:16) + Address 0x........ is not derived from any known block +about to do 16 [-1] + +Invalid read of size 4 + at 0x........: main (neg.c:16) + Address 0x........ is not derived from any known block +about to do 18 [0] + +Invalid read of size 4 + at 0x........: main (neg.c:18) + Address 0x........ is not derived from any known block +about to do 18 [-1] + +Invalid read of size 4 + at 0x........: main (neg.c:18) + Address 0x........ is not derived from any known block +about to do 20 [0] + +Invalid read of size 4 + at 0x........: main (neg.c:20) + Address 0x........ is not derived from any known block +about to do 20 [-1] + +Invalid read of size 4 + at 0x........: main (neg.c:20) + Address 0x........ is not derived from any known block +about to do 22 [0] + +Invalid read of size 4 + at 0x........: main (neg.c:22) + Address 0x........ is not derived from any known block +about to do 22 [-1] + +Invalid read of size 4 + at 0x........: main (neg.c:22) + Address 0x........ is not derived from any known block + + +ERROR SUMMARY: 10 errors from 10 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/neg.vgtest-disabled b/exp-sgcheck/tests/neg.vgtest-disabled new file mode 100644 index 00000000..c546a43f --- /dev/null +++ b/exp-sgcheck/tests/neg.vgtest-disabled @@ -0,0 +1,2 @@ +prog: neg +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/not.c b/exp-sgcheck/tests/not.c new file mode 100644 index 00000000..c5c08d13 --- /dev/null +++ b/exp-sgcheck/tests/not.c @@ -0,0 +1,25 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // NOT ========================================================= + ui(~, p, n); // det, det + + ui(~, up, n); // det, det + + ui(~, un, n); // det, det + + ui(~, n, n); // det, det + + ui(~, nn, n); // det, det + + return 0; +} diff --git a/exp-sgcheck/tests/not.stderr.exp b/exp-sgcheck/tests/not.stderr.exp new file mode 100644 index 00000000..0a5b8d7c --- /dev/null +++ b/exp-sgcheck/tests/not.stderr.exp @@ -0,0 +1,73 @@ + +about to do 14 [0] +Invalid read of size 4 + at 0x........: main (not.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 14 [-1] + +Invalid read of size 4 + at 0x........: main (not.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 16 [0] + +Invalid read of size 4 + at 0x........: main (not.c:16) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 16 [-1] + +Invalid read of size 4 + at 0x........: main (not.c:16) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 18 [0] + +Invalid read of size 4 + at 0x........: main (not.c:18) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 18 [-1] + +Invalid read of size 4 + at 0x........: main (not.c:18) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 20 [0] + +Invalid read of size 4 + at 0x........: main (not.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 20 [-1] + +Invalid read of size 4 + at 0x........: main (not.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 22 [0] + +Invalid read of size 4 + at 0x........: main (not.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block +about to do 22 [-1] + +Invalid read of size 4 + at 0x........: main (not.c:22) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is not derived from any known block + + +ERROR SUMMARY: 10 errors from 10 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/not.vgtest-disabled b/exp-sgcheck/tests/not.vgtest-disabled new file mode 100644 index 00000000..266c349f --- /dev/null +++ b/exp-sgcheck/tests/not.vgtest-disabled @@ -0,0 +1,2 @@ +prog: not +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/or.c b/exp-sgcheck/tests/or.c new file mode 100644 index 00000000..6fd2128f --- /dev/null +++ b/exp-sgcheck/tests/or.c @@ -0,0 +1,42 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // OR ========================================================== + g(|, n, n, n); // det, det + + g(|, n, p, p); // ok, det + + g(|, p, n, p); // ok, det + + g(|, p, p, e); // detected bad OR; ok, det + g(|, p, p2, e); // detected bad OR; det, det + + g(|, n, un, u); // undet, undet + g(|, n, up, u); // ok, undet + + g(|, un, n, u); // undet, undet + g(|, up, n, u); // ok, undet + + g(|, un, un, u); // undet, undet + g(|, un, up, u); // ok, undet + g(|, up, un, u); // ok, undet + g(|, up, up, u); // undetected bad OR; ok, undet + g(|, up, up2,u); // undetected bad OR; undet, undet + + g(|, un, p, u); // ok, undet + g(|, up, p, u); // undetected bad OR; undet, undet + + g(|, p, un, u); // ok, undet + g(|, p, up, u); // undetected bad OR; undet, undet + + return 0; +} diff --git a/exp-sgcheck/tests/or.stderr.exp b/exp-sgcheck/tests/or.stderr.exp new file mode 100644 index 00000000..e0f9b56f --- /dev/null +++ b/exp-sgcheck/tests/or.stderr.exp @@ -0,0 +1,92 @@ + +about to do 14 [0] +Invalid read of size 4 + at 0x........: main (or.c:14) + Address 0x........ is not derived from any known block +about to do 14 [-1] + +Invalid read of size 4 + at 0x........: main (or.c:14) + Address 0x........ is not derived from any known block +about to do 16 [0] +about to do 16 [-1] + +Invalid read of size 4 + at 0x........: main (or.c:16) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 18 [0] +about to do 18 [-1] + +Invalid read of size 4 + at 0x........: main (or.c:18) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + +Invalid OR + at 0x........: main (or.c:20) +Both args derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 20 [0] + +Invalid read of size 4 + at 0x........: main (or.c:20) + Address 0x........ is not derived from any known block +about to do 20 [-1] + +Invalid read of size 4 + at 0x........: main (or.c:20) + Address 0x........ is not derived from any known block + +Invalid arguments to Or32/Or64 + at 0x........: main (or.c:21) + First arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + Second arg derived from address 0x........ of 40-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 21 [0] + +Invalid read of size 4 + at 0x........: main (or.c:21) + Address 0x........ is not derived from any known block +about to do 21 [-1] + +Invalid read of size 4 + at 0x........: main (or.c:21) + Address 0x........ is not derived from any known block +about to do 23 [0] +about to do 23 [-1] +about to do 24 [0] +about to do 24 [-1] +about to do 26 [0] +about to do 26 [-1] +about to do 27 [0] +about to do 27 [-1] +about to do 29 [0] +about to do 29 [-1] +about to do 30 [0] +about to do 30 [-1] +about to do 31 [0] +about to do 31 [-1] +about to do 32 [0] +about to do 32 [-1] +about to do 33 [0] +about to do 33 [-1] +about to do 35 [0] +about to do 35 [-1] +about to do 36 [0] +about to do 36 [-1] +about to do 38 [0] +about to do 38 [-1] +about to do 39 [0] +about to do 39 [-1] + + +ERROR SUMMARY: 10 errors from 10 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/or.vgtest-disabled b/exp-sgcheck/tests/or.vgtest-disabled new file mode 100644 index 00000000..9a714a16 --- /dev/null +++ b/exp-sgcheck/tests/or.vgtest-disabled @@ -0,0 +1,2 @@ +prog: or +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/partial.c b/exp-sgcheck/tests/partial.c new file mode 100644 index 00000000..af072815 --- /dev/null +++ b/exp-sgcheck/tests/partial.c @@ -0,0 +1,52 @@ + +#include <stdlib.h> + +int main ( void ) +{ + int* x3 = malloc(3); float f __attribute__((unused)), *f3 = malloc(3); + int* x4 = malloc(4); double d __attribute__((unused)), *d7 = malloc(7); + int* x5 = malloc(5); long long int lli __attribute__((unused)), *lli7 = malloc(7); + int* x6 = malloc(6); char c __attribute__((unused)), *c0 = malloc(0); + int* x7 = malloc(7); short int s __attribute__((unused)), *s1 = malloc(1); + int x __attribute__((unused)); + int* y4 = malloc(4); + int* y5 = malloc(5); + int* y6 = malloc(6); + int* y7 = malloc(7); + + #define ADDB(ptr, n) ((int*)(((unsigned long)(ptr)) + (n))) + + // All these overrun by a single byte; the reads are happening at + // different alignments. + x = * ADDB(x3,0); // ok if --partial-loads-ok=yes + x = * ADDB(x4,1); + x = * ADDB(x5,2); + x = * ADDB(x6,3); + x = * ADDB(x7,4); // ok if --partial-loads-ok=yes + + // These are fine + x = * ADDB(y4,0); + x = * ADDB(y5,1); + x = * ADDB(y6,2); + x = * ADDB(y7,3); + + // These are all bad, at different points along + x = * ADDB(x3,-1); // before + x = * ADDB(x3, 0); // inside // ok if --partial-loads-ok=yes ... + x = * ADDB(x3, 1); // inside // ... but only on 32 bit platforms + x = * ADDB(x3, 2); // inside // ... ditto + x = * ADDB(x3, 3); // after + + // These are all bad + f = * f3; // ok if --partial-loads-ok=yes // ... ditto + d = * d7; + lli = * lli7; // ok if --partial-loads-ok=yes see XXX below + c = * c0; + s = * s1; + + return 0; +} + +/* Note re XXX, this gives different behaviour on 32 and 64 bit +platforms, because on 64-bit it's one load whereas as on 32 bit +platforms it's necessarily 2 32-bit loads, and the first one is OK. */ diff --git a/exp-sgcheck/tests/partial_bad.stderr.exp-glibc25-amd64 b/exp-sgcheck/tests/partial_bad.stderr.exp-glibc25-amd64 new file mode 100644 index 00000000..58888f93 --- /dev/null +++ b/exp-sgcheck/tests/partial_bad.stderr.exp-glibc25-amd64 @@ -0,0 +1,108 @@ + +Invalid read of size 4 + at 0x........: main (partial.c:21) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:22) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:7) + +Invalid read of size 4 + at 0x........: main (partial.c:23) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 5 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:8) + +Invalid read of size 4 + at 0x........: main (partial.c:24) + Address 0x........ is 3 bytes inside the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 4 + at 0x........: main (partial.c:25) + Address 0x........ is 4 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:10) + +Invalid read of size 4 + at 0x........: main (partial.c:34) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:35) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:36) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:37) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:38) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:41) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 8 + at 0x........: main (partial.c:42) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:7) + +Invalid read of size 8 + at 0x........: main (partial.c:43) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:8) + +Invalid read of size 1 + at 0x........: main (partial.c:44) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 0 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 2 + at 0x........: main (partial.c:45) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 1 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:10) + + +ERROR SUMMARY: 15 errors from 15 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/partial_bad.stderr.exp-glibc25-x86 b/exp-sgcheck/tests/partial_bad.stderr.exp-glibc25-x86 new file mode 100644 index 00000000..c365a2b2 --- /dev/null +++ b/exp-sgcheck/tests/partial_bad.stderr.exp-glibc25-x86 @@ -0,0 +1,108 @@ + +Invalid read of size 4 + at 0x........: main (partial.c:21) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:22) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:7) + +Invalid read of size 4 + at 0x........: main (partial.c:23) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 5 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:8) + +Invalid read of size 4 + at 0x........: main (partial.c:24) + Address 0x........ is 3 bytes inside the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 4 + at 0x........: main (partial.c:25) + Address 0x........ is 4 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:10) + +Invalid read of size 4 + at 0x........: main (partial.c:34) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:35) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:36) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:37) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:38) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:41) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 8 + at 0x........: main (partial.c:42) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:7) + +Invalid read of size 4 + at 0x........: main (partial.c:43) + Address 0x........ is 4 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:8) + +Invalid read of size 1 + at 0x........: main (partial.c:44) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 0 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 2 + at 0x........: main (partial.c:45) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 1 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:10) + + +ERROR SUMMARY: 15 errors from 15 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/partial_bad.vgtest b/exp-sgcheck/tests/partial_bad.vgtest new file mode 100644 index 00000000..094946b6 --- /dev/null +++ b/exp-sgcheck/tests/partial_bad.vgtest @@ -0,0 +1,3 @@ +prereq: ./is_arch_supported +prog: partial +vgopts: --partial-loads-ok=no diff --git a/exp-sgcheck/tests/partial_good.stderr.exp-glibc25-amd64 b/exp-sgcheck/tests/partial_good.stderr.exp-glibc25-amd64 new file mode 100644 index 00000000..3b72c0e6 --- /dev/null +++ b/exp-sgcheck/tests/partial_good.stderr.exp-glibc25-amd64 @@ -0,0 +1,94 @@ + +Invalid read of size 4 + at 0x........: main (partial.c:21) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:22) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:7) + +Invalid read of size 4 + at 0x........: main (partial.c:23) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 5 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:8) + +Invalid read of size 4 + at 0x........: main (partial.c:24) + Address 0x........ is 3 bytes inside the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 4 + at 0x........: main (partial.c:25) + Address 0x........ is 4 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:10) + +Invalid read of size 4 + at 0x........: main (partial.c:34) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:35) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:36) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:37) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:38) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:41) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 1 + at 0x........: main (partial.c:44) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 0 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 2 + at 0x........: main (partial.c:45) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 1 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:10) + + +ERROR SUMMARY: 13 errors from 13 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/partial_good.stderr.exp-glibc25-x86 b/exp-sgcheck/tests/partial_good.stderr.exp-glibc25-x86 new file mode 100644 index 00000000..0f9bd892 --- /dev/null +++ b/exp-sgcheck/tests/partial_good.stderr.exp-glibc25-x86 @@ -0,0 +1,73 @@ + +Invalid read of size 4 + at 0x........: main (partial.c:22) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:7) + +Invalid read of size 4 + at 0x........: main (partial.c:23) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 5 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:8) + +Invalid read of size 4 + at 0x........: main (partial.c:24) + Address 0x........ is 3 bytes inside the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 4 + at 0x........: main (partial.c:34) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:36) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:37) + Address 0x........ is 2 bytes inside the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 4 + at 0x........: main (partial.c:38) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 3 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:6) + +Invalid read of size 8 + at 0x........: main (partial.c:42) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 7 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:7) + +Invalid read of size 1 + at 0x........: main (partial.c:44) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 0 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:9) + +Invalid read of size 2 + at 0x........: main (partial.c:45) + Address 0x........ is 0 bytes inside the accessing pointer's + legitimate range, a block of size 1 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (partial.c:10) + + +ERROR SUMMARY: 10 errors from 10 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/partial_good.vgtest b/exp-sgcheck/tests/partial_good.vgtest new file mode 100644 index 00000000..ea7d2855 --- /dev/null +++ b/exp-sgcheck/tests/partial_good.vgtest @@ -0,0 +1,3 @@ +prereq: ./is_arch_supported +prog: partial +vgopts: --partial-loads-ok=yes diff --git a/exp-sgcheck/tests/preen_invars.c b/exp-sgcheck/tests/preen_invars.c new file mode 100644 index 00000000..cef91be3 --- /dev/null +++ b/exp-sgcheck/tests/preen_invars.c @@ -0,0 +1,52 @@ + +#include <stdio.h> +#include <assert.h> +#include <dlfcn.h> + +/* see comments in preen_invar_so.c for explanation of this */ + + +int main ( void ) +{ + int i, r, sum = 0; + char* im_a_global_array; + void* hdl = dlopen("./preen_invars_so.so", RTLD_NOW); + assert(hdl); + im_a_global_array = dlsym(hdl, "im_a_global_array"); + assert(im_a_global_array); + /* printf("%p %p\n", im_a_global_array, me_too_me_too); */ + + /* poke around in the global array, so as to cause exp-ptrcheck + to generate an Inv_Global invar for it. */ + for (i = 10/*ERROR*/; i >= 0; i--) { + sum += im_a_global_array[i]; + } + /* iterating 10 .. 0 causes an Unknown->Global transition at i = 9. + We do it this way in order that at the end of a loop, there is a + Global invar in place for the memory read in the loop, so that + the subsequent dlclose (hence munmap) causes it to get preened. + + Unfortunately there's nothing to show that the preen was + successful or happened at all. The only way to see is from the + -v output: + + --686-- sg_: 251 Invars preened, of which 1 changed + + It's the "1 changed" bit which is significant. + */ + + /* let's hope gcc is not clever enough to optimise this away, since + if it does, then it will also nuke the preceding loop, and + thereby render this test program useless. */ + + if (sum & 1) printf("%s bar %d\n", "foo", sum & 1); else + printf("foo %s %d\n", "bar", 1 - (sum & 1)); + + /* Now close (== unmap) the array, so that exp-ptrcheck has to check + its collection of Inv_Global invars, and remove this one from + it. */ + r = dlclose(hdl); + assert(r == 0); + + return 0; +} diff --git a/exp-sgcheck/tests/preen_invars.stderr.exp-glibc28-amd64 b/exp-sgcheck/tests/preen_invars.stderr.exp-glibc28-amd64 new file mode 100644 index 00000000..47e35137 --- /dev/null +++ b/exp-sgcheck/tests/preen_invars.stderr.exp-glibc28-amd64 @@ -0,0 +1,9 @@ + +Invalid read of size 1 + at 0x........: main (preen_invars.c:22) + Address 0x........ expected vs actual: + Expected: unknown + Actual: global array "im_a_global_arr" in object with soname "preen_invars_so" + + +ERROR SUMMARY: 1 errors from 1 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/preen_invars.stdout.exp b/exp-sgcheck/tests/preen_invars.stdout.exp new file mode 100644 index 00000000..b3162bea --- /dev/null +++ b/exp-sgcheck/tests/preen_invars.stdout.exp @@ -0,0 +1 @@ +foo bar 1 diff --git a/exp-sgcheck/tests/preen_invars.vgtest b/exp-sgcheck/tests/preen_invars.vgtest new file mode 100644 index 00000000..49da4bb9 --- /dev/null +++ b/exp-sgcheck/tests/preen_invars.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: preen_invars diff --git a/exp-sgcheck/tests/preen_invars_so.c b/exp-sgcheck/tests/preen_invars_so.c new file mode 100644 index 00000000..0e59d9ce --- /dev/null +++ b/exp-sgcheck/tests/preen_invars_so.c @@ -0,0 +1,12 @@ + +/* This file contains a global array. It is compiled into a .so, + which is dlopened by preen_invar.c. That then accesses the global + array, hence generating Inv_Global invariants in sg_main.c. + + preen_invar.c then dlcloses this object, causing it to get + unmapped; and we then need to be sure that the Inv_Global is + removed by preen_Invars (or, at least, that the system doesn't + crash..). */ + +char im_a_global_array[10]; + diff --git a/exp-sgcheck/tests/pth_create.c b/exp-sgcheck/tests/pth_create.c new file mode 100644 index 00000000..2c2d5bb3 --- /dev/null +++ b/exp-sgcheck/tests/pth_create.c @@ -0,0 +1,22 @@ + +#include <pthread.h> +#include <stdlib.h> + + + +// This demonstrates an error for a pre_mem_{read,write} event that comes +// from the core, rather than a syscall (ie. part == Vg_CorePart instead of +// part == Vg_CoreSyscall). + + +int main(void) +{ + pthread_key_t* key = malloc(sizeof(pthread_key_t)); + pthread_key_t* key2 = malloc(sizeof(pthread_key_t)); + + pthread_key_create ( (pthread_key_t*)((long)key + 1), NULL ); + free(key2); + pthread_key_create ( key2 , NULL ); + + return 0; +} diff --git a/exp-sgcheck/tests/pth_create.stderr.exp b/exp-sgcheck/tests/pth_create.stderr.exp new file mode 100644 index 00000000..0fab75fa --- /dev/null +++ b/exp-sgcheck/tests/pth_create.stderr.exp @@ -0,0 +1,19 @@ + +Invalid write of size 4 + at 0x........: pthread_key_create (in /...libpthread...) + by 0x........: main (pth_create.c:17) + Address 0x........ is 1 bytes inside the accessing pointer's + legitimate range, a block of size 4 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (pth_create.c:14) + +Invalid write of size 4 + at 0x........: pthread_key_create (in /...libpthread...) + by 0x........: main (pth_create.c:19) + Address 0x........ is 0 bytes inside the accessing pointer's + once-legitimate range, a block of size 4 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (pth_create.c:18) + + +ERROR SUMMARY: 2 errors from 2 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/pth_create.vgtest b/exp-sgcheck/tests/pth_create.vgtest new file mode 100644 index 00000000..91fa9b13 --- /dev/null +++ b/exp-sgcheck/tests/pth_create.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: pth_create diff --git a/exp-sgcheck/tests/pth_specific.c b/exp-sgcheck/tests/pth_specific.c new file mode 100644 index 00000000..9b8ca919 --- /dev/null +++ b/exp-sgcheck/tests/pth_specific.c @@ -0,0 +1,34 @@ +#include <pthread.h> +#include <assert.h> +#include <stdlib.h> + +// This shows that putting a segment pointer into a thread-specific data +// area and then getting it out again doesn't lose info -- even though the +// key allocation/getting is done on the real CPU where the skin can't see, +// the get/set of the info is done using that key on the simd CPU where it +// can see, so everything works out fine. + +int main(void) +{ + pthread_key_t key; + char *x, *z; + char y __attribute__((unused)); + + x = malloc(100); + + y = x[-1]; // error + x[1] = 'z'; + + assert( 0 == pthread_key_create ( &key, NULL ) ); + assert( 0 == pthread_setspecific( key, x ) ); + z = (char*)pthread_getspecific( key ); + assert( 0 != z ); + + y = z[-1]; // error + + // ensure the key went in and out correctly + assert(z == x); + assert(z[1] == 'z'); + + return 0; +} diff --git a/exp-sgcheck/tests/pth_specific.stderr.exp b/exp-sgcheck/tests/pth_specific.stderr.exp new file mode 100644 index 00000000..1b5cef41 --- /dev/null +++ b/exp-sgcheck/tests/pth_specific.stderr.exp @@ -0,0 +1,17 @@ + +Invalid read of size 1 + at 0x........: main (pth_specific.c:19) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 100 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (pth_specific.c:17) + +Invalid read of size 1 + at 0x........: main (pth_specific.c:27) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 100 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (pth_specific.c:17) + + +ERROR SUMMARY: 2 errors from 2 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/pth_specific.vgtest b/exp-sgcheck/tests/pth_specific.vgtest new file mode 100644 index 00000000..5e6789b6 --- /dev/null +++ b/exp-sgcheck/tests/pth_specific.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: pth_specific diff --git a/exp-sgcheck/tests/realloc.c b/exp-sgcheck/tests/realloc.c new file mode 100644 index 00000000..8884664e --- /dev/null +++ b/exp-sgcheck/tests/realloc.c @@ -0,0 +1,46 @@ + +#include <stdlib.h> + +int main(void) +{ + int i __attribute__((unused)); + int* y __attribute__((unused)); + int** x = malloc(sizeof(int*) * 100); + int* x2 = malloc(sizeof(int) * 100); + void* sink __attribute__((unused)); + x[0] = x2; // this is to check the pointerness is copied across ok + x[49] = x2; // this is to check the pointerness is copied across ok + + i = *x[0]; + i = *x[49]; + + x = realloc(x, sizeof(int*)*50); // smaller + y = x[0]; // ok + y = x[49]; // ok + y = x[-1]; // bad + y = x[50]; // bad + i = *x[0]; // ok + i = *x[49]; // ok + + x = realloc(x, sizeof(int*)*50); // same size + y = x[0]; // ok + y = x[49]; // ok + y = x[-1]; // bad + y = x[50]; // bad + i = *x[0]; // ok + i = *x[49]; // ok + + x = realloc(x, sizeof(int*)*100); // bigger + y = x[0]; // ok + y = x[49]; // ok + y = x[50]; // ok + y = x[99]; // ok + y = x[-1]; // bad + y = x[100]; // bad + i = *x[0]; // ok + i = *x[49]; // ok + + sink = realloc((void*)0x99, 10); // fails + + return 0; +} diff --git a/exp-sgcheck/tests/realloc.stderr.exp-glibc25-amd64 b/exp-sgcheck/tests/realloc.stderr.exp-glibc25-amd64 new file mode 100644 index 00000000..99c551b7 --- /dev/null +++ b/exp-sgcheck/tests/realloc.stderr.exp-glibc25-amd64 @@ -0,0 +1,45 @@ + +Invalid read of size 8 + at 0x........: main (realloc.c:20) + Address 0x........ is 8 bytes before the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:17) + +Invalid read of size 8 + at 0x........: main (realloc.c:21) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:17) + +Invalid read of size 8 + at 0x........: main (realloc.c:28) + Address 0x........ is 8 bytes before the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:25) + +Invalid read of size 8 + at 0x........: main (realloc.c:29) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:25) + +Invalid read of size 8 + at 0x........: main (realloc.c:38) + Address 0x........ is 8 bytes before the accessing pointer's + legitimate range, a block of size 800 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:33) + +Invalid read of size 8 + at 0x........: main (realloc.c:39) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 800 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:33) + + +ERROR SUMMARY: 6 errors from 6 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/realloc.stderr.exp-glibc25-x86 b/exp-sgcheck/tests/realloc.stderr.exp-glibc25-x86 new file mode 100644 index 00000000..265f48cc --- /dev/null +++ b/exp-sgcheck/tests/realloc.stderr.exp-glibc25-x86 @@ -0,0 +1,45 @@ + +Invalid read of size 4 + at 0x........: main (realloc.c:20) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 200 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:17) + +Invalid read of size 4 + at 0x........: main (realloc.c:21) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 200 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:17) + +Invalid read of size 4 + at 0x........: main (realloc.c:28) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 200 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:25) + +Invalid read of size 4 + at 0x........: main (realloc.c:29) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 200 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:25) + +Invalid read of size 4 + at 0x........: main (realloc.c:38) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:33) + +Invalid read of size 4 + at 0x........: main (realloc.c:39) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 400 alloc'd + at 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (realloc.c:33) + + +ERROR SUMMARY: 6 errors from 6 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/realloc.vgtest b/exp-sgcheck/tests/realloc.vgtest new file mode 100644 index 00000000..1cc74ede --- /dev/null +++ b/exp-sgcheck/tests/realloc.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: realloc diff --git a/exp-sgcheck/tests/sh_script b/exp-sgcheck/tests/sh_script new file mode 100755 index 00000000..ca2b0b8a --- /dev/null +++ b/exp-sgcheck/tests/sh_script @@ -0,0 +1,4 @@ +#! /bin/bash +if [ $# != 0 ] ; then + echo "too many args" +fi diff --git a/exp-sgcheck/tests/sh_script.stderr.exp b/exp-sgcheck/tests/sh_script.stderr.exp new file mode 100644 index 00000000..d18786f8 --- /dev/null +++ b/exp-sgcheck/tests/sh_script.stderr.exp @@ -0,0 +1,3 @@ + + +ERROR SUMMARY: 0 errors from 0 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/sh_script.vgtest-disabled b/exp-sgcheck/tests/sh_script.vgtest-disabled new file mode 100644 index 00000000..5942de2c --- /dev/null +++ b/exp-sgcheck/tests/sh_script.vgtest-disabled @@ -0,0 +1 @@ +prog: sh_script diff --git a/exp-sgcheck/tests/stackerr.c b/exp-sgcheck/tests/stackerr.c new file mode 100644 index 00000000..36b8e672 --- /dev/null +++ b/exp-sgcheck/tests/stackerr.c @@ -0,0 +1,53 @@ + +/* Check basic stack overflow detection. + + It's difficult to get consistent behaviour across all platforms. + For example, x86 w/ gcc-4.3.1 gives + + Expected: stack array "a" in frame 2 back from here + Actual: stack array "beforea" in frame 2 back from here + + whereas amd64 w/ gcc-4.3.1 gives + + Expected: stack array "a" in frame 2 back from here + Actual: unknown + + This happens because on x86 the arrays are placed on the + stack without holes in between, but not so for amd64. I don't + know why. +*/ + + +#include <stdio.h> + +__attribute__((noinline)) void foo ( long* sa, int n ) +{ + int i; + for (i = 0; i < n; i++) + sa[i] = 0; +} + +__attribute__((noinline)) void bar ( long* sa, int n ) +{ + foo(sa, n); +} + +int main ( void ) +{ + int i; + long beforea[3]; + long a[7]; + long aftera[3]; + bar(a, 7+1); /* generates error */ + bar(a, 7+0); /* generates no error */ + for (i = 0; i < 7+1; i++) { + a[i] = 0; + } + {char beforebuf[8]; + char buf[8]; + char afterbuf[8]; + sprintf(buf, "%d", 123456789); + return 1 & ((a[4] + beforea[1] + aftera[1] + beforebuf[1] + + buf[2] + afterbuf[3]) / 100000) ; + } +} diff --git a/exp-sgcheck/tests/stackerr.stderr.exp-glibc27-x86 b/exp-sgcheck/tests/stackerr.stderr.exp-glibc27-x86 new file mode 100644 index 00000000..b876eafd --- /dev/null +++ b/exp-sgcheck/tests/stackerr.stderr.exp-glibc27-x86 @@ -0,0 +1,27 @@ + +Invalid write of size 4 + at 0x........: foo (stackerr.c:27) + by 0x........: bar (stackerr.c:32) + by 0x........: main (stackerr.c:41) + Address 0x........ expected vs actual: + Expected: stack array "a" in frame 2 back from here + Actual: stack array "beforea" in frame 2 back from here + +Invalid write of size 4 + at 0x........: main (stackerr.c:44) + Address 0x........ expected vs actual: + Expected: stack array "a" in this frame + Actual: stack array "beforea" in this frame + +Invalid write of size 1 + at 0x........: _IO_default_xsputn (in /...libc...) + by 0x........: ... + by 0x........: ... + by 0x........: ... + by 0x........: main (stackerr.c:49) + Address 0x........ expected vs actual: + Expected: stack array "buf" in frame 4 back from here + Actual: stack array "beforebuf" in frame 4 back from here + + +ERROR SUMMARY: 3 errors from 3 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/stackerr.stderr.exp-glibc28-amd64 b/exp-sgcheck/tests/stackerr.stderr.exp-glibc28-amd64 new file mode 100644 index 00000000..89da7a77 --- /dev/null +++ b/exp-sgcheck/tests/stackerr.stderr.exp-glibc28-amd64 @@ -0,0 +1,27 @@ + +Invalid write of size 8 + at 0x........: foo (stackerr.c:27) + by 0x........: bar (stackerr.c:32) + by 0x........: main (stackerr.c:41) + Address 0x........ expected vs actual: + Expected: stack array "a" in frame 2 back from here + Actual: unknown + +Invalid write of size 8 + at 0x........: main (stackerr.c:44) + Address 0x........ expected vs actual: + Expected: stack array "a" in this frame + Actual: unknown + +Invalid write of size 1 + at 0x........: _IO_default_xsputn (in /...libc...) + by 0x........: ... + by 0x........: ... + by 0x........: ... + by 0x........: main (stackerr.c:49) + Address 0x........ expected vs actual: + Expected: stack array "buf" in frame 4 back from here + Actual: unknown + + +ERROR SUMMARY: 3 errors from 3 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/stackerr.stdout.exp b/exp-sgcheck/tests/stackerr.stdout.exp new file mode 100644 index 00000000..e69de29b --- /dev/null +++ b/exp-sgcheck/tests/stackerr.stdout.exp diff --git a/exp-sgcheck/tests/stackerr.vgtest b/exp-sgcheck/tests/stackerr.vgtest new file mode 100644 index 00000000..0a1139df --- /dev/null +++ b/exp-sgcheck/tests/stackerr.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: stackerr diff --git a/exp-sgcheck/tests/strcpy.c b/exp-sgcheck/tests/strcpy.c new file mode 100644 index 00000000..83522975 --- /dev/null +++ b/exp-sgcheck/tests/strcpy.c @@ -0,0 +1,44 @@ +#include <stdlib.h> +#include <string.h> + +// This shows the case whereby subtraction between two pointers from +// different segments can be used legitimately. + +// dest: stack, src: heap +char* my_strcpy (char* dest, const char* src) +{ + char c, *s = (char *) src; + long off = dest - s; + off = off - 1; + do { + c = *s++; + s[off] = c; // s + off == dest + } while (c != '\0'); + return dest; +} + +int main(void) +{ + char* h = "hello, world"; + char* p1 = strdup(h); + char* p2 = strdup(h); + char u1[13]; + char u2[13]; + + // All these are legit + p1[p2-p1] = 0; // p-p (must be BADSEG'd) // ea is p2[0] + u1[p2-u1] = 0; // p-? + p1[u2-p1] = 0; // ?-p (must be BADSEG'd) + u1[u2-u1] = 0; // ?-? + + // All these are a 1-byte underrun + p1[p2-p1-1] = 0; // p-p (must be BADSEG'd) // ea is p2[-1] + u1[p2-u1-1] = 0; // p-? (undet) + p1[u2-p1-1] = 0; // ?-p (must be BADSEG'd) + u1[u2-u1-1] = 0; // ?-? (undet) + + my_strcpy(u1, p1); + my_strcpy(u2, u1); + + return 0; +} diff --git a/exp-sgcheck/tests/strcpy.stderr.exp b/exp-sgcheck/tests/strcpy.stderr.exp new file mode 100644 index 00000000..d18786f8 --- /dev/null +++ b/exp-sgcheck/tests/strcpy.stderr.exp @@ -0,0 +1,3 @@ + + +ERROR SUMMARY: 0 errors from 0 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/strcpy.vgtest b/exp-sgcheck/tests/strcpy.vgtest new file mode 100644 index 00000000..d686e9f3 --- /dev/null +++ b/exp-sgcheck/tests/strcpy.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: strcpy diff --git a/exp-sgcheck/tests/strlen.c b/exp-sgcheck/tests/strlen.c new file mode 100644 index 00000000..92abf461 --- /dev/null +++ b/exp-sgcheck/tests/strlen.c @@ -0,0 +1,33 @@ + +#include <stdlib.h> +#include <string.h> + +// glibc's versions of functions like strlen() do things word-wise instead +// of byte-wise, which means they can overrun the end of strings, etc. +// Naughty, but must be safe, I guess; Annelid copes with this in the same +// way Memcheck does, letting it happen unless the --partial-loads-ok=no +// option is used. + +int main(void) +{ + char* h = "hello, world"; + char* p = strdup(h); + char u[20]; + char* c __attribute__((unused)); + int len; + + len = strlen(p); + + c = strchr (p, 'l'); + c = strchr (p, 'x'); + + c = strrchr(p, 'l'); + c = strrchr(p, 'x'); + + c = memchr (p, 'l', len); // glibc version ok? + c = memchr (p, 'x', len); + + memcpy(u, p, len+1); // glibc version ok? + + return 0; +} diff --git a/exp-sgcheck/tests/strlen_bad.stderr.exp b/exp-sgcheck/tests/strlen_bad.stderr.exp new file mode 100644 index 00000000..eab9bb33 --- /dev/null +++ b/exp-sgcheck/tests/strlen_bad.stderr.exp @@ -0,0 +1,43 @@ + +Invalid read of size 4 + at 0x........: strlen (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is 12 bytes inside the accessing pointer's + legitimate range, a block of size 13 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: __strdup (in /...libc...) + by 0x........: main (strlen.c:14) + +Invalid read of size 4 + at 0x........: strchr (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is 12 bytes inside the accessing pointer's + legitimate range, a block of size 13 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: __strdup (in /...libc...) + by 0x........: main (strlen.c:14) + +Invalid read of size 4 + at 0x........: strrchr (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is 12 bytes inside the accessing pointer's + legitimate range, a block of size 13 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: __strdup (in /...libc...) + by 0x........: main (strlen.c:14) + +Invalid read of size 4 + at 0x........: strrchr (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is 12 bytes inside the accessing pointer's + legitimate range, a block of size 13 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: __strdup (in /...libc...) + by 0x........: main (strlen.c:14) + + +ERROR SUMMARY: 4 errors from 4 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/strlen_bad.vgtest-disabled b/exp-sgcheck/tests/strlen_bad.vgtest-disabled new file mode 100644 index 00000000..9f418726 --- /dev/null +++ b/exp-sgcheck/tests/strlen_bad.vgtest-disabled @@ -0,0 +1,2 @@ +prog: strlen +vgopts: --partial-loads-ok=no diff --git a/exp-sgcheck/tests/strlen_good.stderr.exp b/exp-sgcheck/tests/strlen_good.stderr.exp new file mode 100644 index 00000000..d18786f8 --- /dev/null +++ b/exp-sgcheck/tests/strlen_good.stderr.exp @@ -0,0 +1,3 @@ + + +ERROR SUMMARY: 0 errors from 0 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/strlen_good.vgtest-disabled b/exp-sgcheck/tests/strlen_good.vgtest-disabled new file mode 100644 index 00000000..14e36fa6 --- /dev/null +++ b/exp-sgcheck/tests/strlen_good.vgtest-disabled @@ -0,0 +1,2 @@ +prog: strlen +vgopts: --partial-loads-ok=yes diff --git a/exp-sgcheck/tests/sub.c b/exp-sgcheck/tests/sub.c new file mode 100644 index 00000000..73116b6f --- /dev/null +++ b/exp-sgcheck/tests/sub.c @@ -0,0 +1,41 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" +int aaa(void) { int x = 0x66; return x; } +int bbb(void) { return 0x55; } +int main(void) +{ + #include "arith_include2.c" + + // SUB ========================================================= + g(-, n, n2, n); // det, det // undet, undet? + + g(-, n, p, e); // det, det + + g(-, p, n, p); // ok, det + + g(-, p, pp, B); // det, det + + g(-, n, un, u); // undet, undet + g(-, n, up, u); // undet, undet + + g(-, un, n, u); // undet, undet + g(-, up, n, u); // ok, undet + + g(-, un, un2,u); // det, det + g(-, un, up, u); // undet, undet + g(-, up, un, u); // ok, undet + g(-, up, up, u); // det, det + + g(-, un, p, B); // undet, undet + g(-, up, p, B); // undet, undet + + g(-, p, un, p); // det, det + g(-, p, up, p); // det, det + + return 0; +} diff --git a/exp-sgcheck/tests/sub.stderr.exp b/exp-sgcheck/tests/sub.stderr.exp new file mode 100644 index 00000000..25997986 --- /dev/null +++ b/exp-sgcheck/tests/sub.stderr.exp @@ -0,0 +1,102 @@ + +about to do 15 [0] +Invalid read of size 4 + at 0x........: main (sub.c:15) + Address 0x........ is not derived from any known block +about to do 15 [-1] + +Invalid read of size 4 + at 0x........: main (sub.c:15) + Address 0x........ is not derived from any known block +about to do 17 [0] + +Invalid read of size 4 + at 0x........: main (sub.c:17) + Address 0x........ is not derived from any known block +about to do 17 [-1] + +Invalid read of size 4 + at 0x........: main (sub.c:17) + Address 0x........ is not derived from any known block +about to do 19 [0] +about to do 19 [-1] + +Invalid read of size 4 + at 0x........: main (sub.c:19) + Address 0x........ is 4 bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 21 [0] +about to do 21 [-1] +about to do 23 [0] +about to do 23 [-1] +about to do 24 [0] +about to do 24 [-1] +about to do 26 [0] +about to do 26 [-1] +about to do 27 [0] +about to do 27 [-1] +about to do 29 [0] + +Invalid read of size 4 + at 0x........: main (sub.c:29) + Address 0x........ is not derived from any known block +about to do 29 [-1] + +Invalid read of size 4 + at 0x........: main (sub.c:29) + Address 0x........ is not derived from any known block +about to do 30 [0] +about to do 30 [-1] +about to do 31 [0] +about to do 31 [-1] +about to do 32 [0] + +Invalid read of size 4 + at 0x........: main (sub.c:32) + Address 0x........ is not derived from any known block +about to do 32 [-1] + +Invalid read of size 4 + at 0x........: main (sub.c:32) + Address 0x........ is not derived from any known block +about to do 34 [0] +about to do 34 [-1] +about to do 35 [0] +about to do 35 [-1] +about to do 37 [0] + +Invalid read of size 4 + at 0x........: main (sub.c:37) + Address 0x........ is ... bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 37 [-1] + +Invalid read of size 4 + at 0x........: main (sub.c:37) + Address 0x........ is ... bytes before the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 38 [0] + +Invalid read of size 4 + at 0x........: main (sub.c:38) + Address 0x........ is ... bytes after the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) +about to do 38 [-1] + +Invalid read of size 4 + at 0x........: main (sub.c:38) + Address 0x........ is ... bytes after the accessing pointer's + legitimate range, a block of size 40 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (arith_include2.c:22) + + +ERROR SUMMARY: 13 errors from 13 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/sub.vgtest-disabled b/exp-sgcheck/tests/sub.vgtest-disabled new file mode 100644 index 00000000..45d1aeeb --- /dev/null +++ b/exp-sgcheck/tests/sub.vgtest-disabled @@ -0,0 +1,2 @@ +prog: sub +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/supp.c b/exp-sgcheck/tests/supp.c new file mode 100644 index 00000000..97f77883 --- /dev/null +++ b/exp-sgcheck/tests/supp.c @@ -0,0 +1,19 @@ +#include <string.h> +#include <stdlib.h> +#include <unistd.h> +#include <sys/types.h> +#include <sys/stat.h> +#include <fcntl.h> +#include <sys/time.h> + +int main(void) +{ + int i = 11; int fd = open("/dev/null", O_WRONLY); + char* buf = malloc(sizeof(char) * 6); + char c = buf[-1]; // LoadStoreErr + char* x = buf + (long)buf; // ArithErr + char* y = (char*)((long)buf * i); // AsmErr + write(fd, buf+3, 5); // SysParamErr + close(fd); + return x-y+c; +} diff --git a/exp-sgcheck/tests/supp.stderr.exp b/exp-sgcheck/tests/supp.stderr.exp new file mode 100644 index 00000000..6c091767 --- /dev/null +++ b/exp-sgcheck/tests/supp.stderr.exp @@ -0,0 +1,11 @@ + +Syscall param write(buf) is non-contiguous + at 0x........: write (in /...libc...) + by 0x........: main (supp.c:16) + First byte (0x........) is 3 bytes inside a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (supp.c:12) + Last byte is not inside a known block + + +ERROR SUMMARY: 1 errors from 1 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/supp.supp b/exp-sgcheck/tests/supp.supp new file mode 100644 index 00000000..9d3300a7 --- /dev/null +++ b/exp-sgcheck/tests/supp.supp @@ -0,0 +1,18 @@ +{ + first-in-supp.supp + exp-ptrcheck:Heap + fun:main +} +{ + second-in-supp.supp + exp-ptrcheck:Arith + fun:main +} +{ + third-in-supp.supp + exp-ptrcheck:SysParam + write(buf) + fun:__GI___libc_write + fun:__libc_start_main + obj:*/annelid/tests/supp +} diff --git a/exp-sgcheck/tests/supp.vgtest b/exp-sgcheck/tests/supp.vgtest new file mode 100644 index 00000000..b991f572 --- /dev/null +++ b/exp-sgcheck/tests/supp.vgtest @@ -0,0 +1,3 @@ +prereq: ./is_arch_supported +vgopts: --suppressions=supp.supp +prog: supp diff --git a/exp-sgcheck/tests/suppgen.stderr.exp b/exp-sgcheck/tests/suppgen.stderr.exp new file mode 100644 index 00000000..879fb2bf --- /dev/null +++ b/exp-sgcheck/tests/suppgen.stderr.exp @@ -0,0 +1,61 @@ + +Invalid read of size 1 + at 0x........: main (supp.c:13) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, the 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (supp.c:12) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +---- Print suppression ? --- [Return/N/n/Y/y/C/c] ---- { + <insert a suppression name here> + Annelid:LoadStore + fun:main + fun:__libc_start_main + obj:*/annelid/tests/supp +} + +Invalid ADD + at 0x........: main (supp.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Both args derived from address 0x........ of 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (supp.c:12) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +---- Print suppression ? --- [Return/N/n/Y/y/C/c] ---- { + <insert a suppression name here> + Annelid:Arith + fun:main + fun:__libc_start_main + obj:*/annelid/tests/supp +} +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte (0x........) is 3 bytes within a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (supp.c:12) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Last byte is not within a known block + +---- Print suppression ? --- [Return/N/n/Y/y/C/c] ---- { + <insert a suppression name here> + Annelid:SysParam + write(buf) + fun:__GI___libc_write + fun:__libc_start_main + obj:*/annelid/tests/supp +} + + +ERROR SUMMARY: 3 errors from 3 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/suppgen.stdin b/exp-sgcheck/tests/suppgen.stdin new file mode 100644 index 00000000..b469f970 --- /dev/null +++ b/exp-sgcheck/tests/suppgen.stdin @@ -0,0 +1,5 @@ +y +y +y +y + diff --git a/exp-sgcheck/tests/suppgen.vgtest-disabled b/exp-sgcheck/tests/suppgen.vgtest-disabled new file mode 100644 index 00000000..d606f2a8 --- /dev/null +++ b/exp-sgcheck/tests/suppgen.vgtest-disabled @@ -0,0 +1,4 @@ +prog: supp +vgopts: --gen-suppressions=yes +args: < suppgen.stdin +stderr_filter: filter_suppgen diff --git a/exp-sgcheck/tests/syscall.c b/exp-sgcheck/tests/syscall.c new file mode 100644 index 00000000..b446275b --- /dev/null +++ b/exp-sgcheck/tests/syscall.c @@ -0,0 +1,59 @@ +#include <string.h> +#include <stdlib.h> +#include <unistd.h> +#include <sys/types.h> +#include <sys/stat.h> +#include <fcntl.h> +#include <sys/time.h> + +// For some reason, the stack frame below __GI_write is disappearing. +// Therefore, if I don't want the write errors to be merged, I have to +// ensure they have a different stack trace. I do this by using this +// function. Weird. +__attribute__((noinline)) +void mywrite(char* buf, int len) +{ + write(-1, buf, len); +} + +__attribute__((noinline)) +void mygetitimer(long arg1, struct itimerval* itval) +{ + getitimer(arg1, itval); +} + +__attribute__((noinline)) +void myopen(char* name, long flags) +{ + open(name, flags); +} + +int main(void) +{ + char *buf = malloc(sizeof(char)*6), *buf2 = malloc(sizeof(char)*6); + struct itimerval* itval = malloc(sizeof(struct itimerval) - 1); + int diff = buf2 - buf; + buf[0] = 'h'; + buf[1] = 'e'; + buf[2] = 'l'; + buf[3] = 'l'; + buf[4] = 'o'; + buf[5] = 'x'; + + // error (read) (will fail due to -1, as we want -- don't want any + // unpredictable output to foul up the test) + mywrite(buf+3, 5); // error (read) + mywrite(buf-1, 5); // error (read) + mywrite(buf+1, diff); // error (read) + myopen(buf+3, 0x0); // error (read_asciiz) + + mygetitimer(0, itval); // error (write) + + //---- + free(buf); + mywrite(buf, 5); // error + mywrite(buf+3, 5); // error + mywrite(buf+1, diff); // error (read) + + return 0; +} diff --git a/exp-sgcheck/tests/syscall.stderr.exp b/exp-sgcheck/tests/syscall.stderr.exp new file mode 100644 index 00000000..e3638299 --- /dev/null +++ b/exp-sgcheck/tests/syscall.stderr.exp @@ -0,0 +1,110 @@ + +Warning: invalid file descriptor -1 in syscall write() +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: main (syscall.c:32) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte (0x........) is 3 bytes within a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Last byte is not within a known block +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: main (syscall.c:33) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte is not within a known block +Last byte (0x........) is 3 bytes within a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: main (syscall.c:34) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte (0x........) is 1 bytes within a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Last byte (0x........) is 0 bytes within a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + +Syscall param open(pathname) is non-contiguous + at 0x........: __libc_open (...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte (0x........) is 3 bytes within a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Last byte is not within a known block + +Syscall param getitimer(timer) is non-contiguous + at 0x........: __getitimer (in /...libc...) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte (0x........) is 0 bytes within a 15-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:21) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Last byte is not within a known block +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) contains unaddressable byte(s) + at 0x........: __libc_write (...libc...) + by 0x........: main (syscall.c:41) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Address 0x........ is 0 bytes within a 6-byte block free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:40) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: main (syscall.c:42) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte (0x........) is 3 bytes within a 6-byte block free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:40) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Last byte is not within a known block +Warning: invalid file descriptor -1 in syscall write() + +Syscall param write(buf) is non-contiguous + at 0x........: __libc_write (...libc...) + by 0x........: main (syscall.c:43) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +First byte (0x........) is 1 bytes within a 6-byte block free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:40) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... +Last byte (0x........) is 0 bytes within a 6-byte block alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (syscall.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + + +ERROR SUMMARY: 8 errors from 8 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/syscall.vgtest-disabled b/exp-sgcheck/tests/syscall.vgtest-disabled new file mode 100644 index 00000000..ea58a588 --- /dev/null +++ b/exp-sgcheck/tests/syscall.vgtest-disabled @@ -0,0 +1 @@ +prog: syscall diff --git a/exp-sgcheck/tests/tricky.c b/exp-sgcheck/tests/tricky.c new file mode 100644 index 00000000..624f9e4a --- /dev/null +++ b/exp-sgcheck/tests/tricky.c @@ -0,0 +1,20 @@ + +#include <stdlib.h> + +int main(void) +{ + // When I had n-u --> u, this gave a false positive... can happen because + // p+up can give n if you are (un)lucky, because the result is close enough + // to zero. + int u[20]; + int* p = malloc(sizeof(int) * 100); + int* n; + int* x; + + p[0] = 0; // ok + n = (int*)((long)p + (long)u); // result is n, because near zero! + x = (int*)((long)n - (long)u); // x == p + x[0] = 0; // ok, originally caused false pos. + + return 0; +} diff --git a/exp-sgcheck/tests/tricky.stderr.exp b/exp-sgcheck/tests/tricky.stderr.exp new file mode 100644 index 00000000..d18786f8 --- /dev/null +++ b/exp-sgcheck/tests/tricky.stderr.exp @@ -0,0 +1,3 @@ + + +ERROR SUMMARY: 0 errors from 0 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/tricky.vgtest b/exp-sgcheck/tests/tricky.vgtest new file mode 100644 index 00000000..8ebfc09f --- /dev/null +++ b/exp-sgcheck/tests/tricky.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: tricky diff --git a/exp-sgcheck/tests/unaligned.c b/exp-sgcheck/tests/unaligned.c new file mode 100644 index 00000000..6c7ba39d --- /dev/null +++ b/exp-sgcheck/tests/unaligned.c @@ -0,0 +1,51 @@ + +#include <stdio.h> +#include <stdlib.h> +#include <string.h> + +int main ( void ) +{ + char* x = strdup("hello"); + char c __attribute__((unused)); + char c0[8], c1[8], c2[8], c3[8], c4[8]; + + // Each of these pointers has a different alignment + char** p0 = (char**)&c0[0]; char** p1 = (char**)&c1[1]; + char** p2 = (char**)&c2[2]; char** p3 = (char**)&c3[3]; + char** p4 = (char**)&c4[4]; + *p0 = x; *p1 = x; *p2 = x; + *p3 = x; *p4 = x; + + // These 10 are ok + c = (*p0)[0]; + c = (*p1)[0]; + c = (*p2)[0]; + c = (*p3)[0]; + c = (*p4)[0]; + + c = (*p0)[5]; + c = (*p1)[5]; + c = (*p2)[5]; + c = (*p3)[5]; + c = (*p4)[5]; + + // These 10 are bad + c = (*p0)[-1]; // always word aligned, so det + c = (*p1)[-1]; // undet + c = (*p2)[-1]; // undet + c = (*p3)[-1]; // undet + c = (*p4)[-1]; // undet on 64-bit since not 64-bit aligned + + c = (*p0)[6]; // always word aligned, so det + c = (*p1)[6]; // undet + c = (*p2)[6]; // undet + c = (*p3)[6]; // undet + c = (*p4)[6]; // undet on 64-bit since not 64-bit aligned + + return 0; +} + +/* What this program does: verifies that (unfortunately) if you store a + pointer misaligned, then the associated shadow value decays to Unknown, + and so when you retrieve the pointer later and dereference it, you + get no check :-( */ diff --git a/exp-sgcheck/tests/unaligned.stderr.exp-glibc25-amd64 b/exp-sgcheck/tests/unaligned.stderr.exp-glibc25-amd64 new file mode 100644 index 00000000..47696801 --- /dev/null +++ b/exp-sgcheck/tests/unaligned.stderr.exp-glibc25-amd64 @@ -0,0 +1,19 @@ + +Invalid read of size 1 + at 0x........: main (unaligned.c:33) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: ... + by 0x........: main (unaligned.c:8) + +Invalid read of size 1 + at 0x........: main (unaligned.c:39) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: ... + by 0x........: main (unaligned.c:8) + + +ERROR SUMMARY: 2 errors from 2 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/unaligned.stderr.exp-glibc25-x86 b/exp-sgcheck/tests/unaligned.stderr.exp-glibc25-x86 new file mode 100644 index 00000000..55002a23 --- /dev/null +++ b/exp-sgcheck/tests/unaligned.stderr.exp-glibc25-x86 @@ -0,0 +1,35 @@ + +Invalid read of size 1 + at 0x........: main (unaligned.c:33) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: ... + by 0x........: main (unaligned.c:8) + +Invalid read of size 1 + at 0x........: main (unaligned.c:37) + Address 0x........ is 1 bytes before the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: ... + by 0x........: main (unaligned.c:8) + +Invalid read of size 1 + at 0x........: main (unaligned.c:39) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: ... + by 0x........: main (unaligned.c:8) + +Invalid read of size 1 + at 0x........: main (unaligned.c:43) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 6 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: ... + by 0x........: main (unaligned.c:8) + + +ERROR SUMMARY: 4 errors from 4 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/unaligned.vgtest b/exp-sgcheck/tests/unaligned.vgtest new file mode 100644 index 00000000..240dc60a --- /dev/null +++ b/exp-sgcheck/tests/unaligned.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: unaligned diff --git a/exp-sgcheck/tests/xor.c b/exp-sgcheck/tests/xor.c new file mode 100644 index 00000000..7e3bade1 --- /dev/null +++ b/exp-sgcheck/tests/xor.c @@ -0,0 +1,40 @@ +#include <stdio.h> +#include <stdlib.h> +#include <signal.h> +#include <setjmp.h> +#include <assert.h> + +#include "arith_include1.c" + +int main(void) +{ + #include "arith_include2.c" + + // XOR ========================================================= + g(^, n, n, n); // det, det + + g(^, n, p, u); // ok, undet + + g(^, p, n, u); // ok, undet + + g(^, p, p, n); // det, det + + g(^, n, un, u); // undet, undet + g(^, n, up, u); // ok, undet + + g(^, un, n, u); // undet, undet + g(^, up, n, u); // ok, undet + + g(^, un, un, n); // det, det (range) + g(^, un, up, u); // ok, undet + g(^, up, un, u); // ok, undet + g(^, up, up, n); // det, det + + g(^, un, p, u); // ok, undet + g(^, up, p, u); // undet, undet + + g(^, p, un, u); // ok, undet + g(^, p, up, u); // undet, undet + + return 0; +} diff --git a/exp-sgcheck/tests/xor.stderr.exp b/exp-sgcheck/tests/xor.stderr.exp new file mode 100644 index 00000000..ff28a84a --- /dev/null +++ b/exp-sgcheck/tests/xor.stderr.exp @@ -0,0 +1,83 @@ + +about to do 14 [0] +Invalid read of size 4 + at 0x........: main (xor.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 14 [-1] + +Invalid read of size 4 + at 0x........: main (xor.c:14) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 16 [0] +about to do 16 [-1] +about to do 18 [0] +about to do 18 [-1] +about to do 20 [0] + +Invalid read of size 4 + at 0x........: main (xor.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 20 [-1] + +Invalid read of size 4 + at 0x........: main (xor.c:20) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 22 [0] +about to do 22 [-1] +about to do 23 [0] +about to do 23 [-1] +about to do 25 [0] +about to do 25 [-1] +about to do 26 [0] +about to do 26 [-1] +about to do 28 [0] + +Invalid read of size 4 + at 0x........: main (xor.c:28) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 28 [-1] + +Invalid read of size 4 + at 0x........: main (xor.c:28) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 29 [0] +about to do 29 [-1] +about to do 30 [0] +about to do 30 [-1] +about to do 31 [0] + +Invalid read of size 4 + at 0x........: main (xor.c:31) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 31 [-1] + +Invalid read of size 4 + at 0x........: main (xor.c:31) + by 0x........: __libc_start_main (...libc...) + by 0x........: ... + Address 0x........ is not derived from any known block +about to do 33 [0] +about to do 33 [-1] +about to do 34 [0] +about to do 34 [-1] +about to do 36 [0] +about to do 36 [-1] +about to do 37 [0] +about to do 37 [-1] + + +ERROR SUMMARY: 8 errors from 8 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/xor.vgtest-disabled b/exp-sgcheck/tests/xor.vgtest-disabled new file mode 100644 index 00000000..8d60202e --- /dev/null +++ b/exp-sgcheck/tests/xor.vgtest-disabled @@ -0,0 +1,2 @@ +prog: xor +stderr_filter: filter_add diff --git a/exp-sgcheck/tests/zero.c b/exp-sgcheck/tests/zero.c new file mode 100644 index 00000000..7077bb44 --- /dev/null +++ b/exp-sgcheck/tests/zero.c @@ -0,0 +1,24 @@ + + +#include <stdlib.h> +#include <assert.h> + +int main ( void ) +{ + char c __attribute__((unused)), *c0 = malloc(0), *c1; + + c = *c0; // bad + + c0 = realloc(c0, 10); + assert(c0); + + c = *c0; // ok + + c1 = c0; + c0 = realloc(c0, 0); + assert(!c0); + + c = *c1; // bad, dangling + + return 0; +} diff --git a/exp-sgcheck/tests/zero.stderr.exp b/exp-sgcheck/tests/zero.stderr.exp new file mode 100644 index 00000000..0da65fef --- /dev/null +++ b/exp-sgcheck/tests/zero.stderr.exp @@ -0,0 +1,18 @@ + +Invalid read of size 1 + at 0x........: main (zero.c:10) + Address 0x........ is 0 bytes after the accessing pointer's + legitimate range, a block of size 0 alloc'd + at 0x........: malloc (vg_replace_malloc.c:...) + by 0x........: main (zero.c:8) + +Invalid read of size 1 + at 0x........: main (zero.c:21) + Address 0x........ is 0 bytes inside the accessing pointer's + once-legitimate range, a block of size 10 free'd + at 0x........: free (vg_replace_malloc.c:...) + by 0x........: realloc (vg_replace_malloc.c:...) + by 0x........: main (zero.c:18) + + +ERROR SUMMARY: 2 errors from 2 contexts (suppressed: 0 from 0) diff --git a/exp-sgcheck/tests/zero.vgtest b/exp-sgcheck/tests/zero.vgtest new file mode 100644 index 00000000..3d6333c4 --- /dev/null +++ b/exp-sgcheck/tests/zero.vgtest @@ -0,0 +1,2 @@ +prereq: ./is_arch_supported +prog: zero |