| // Copyright 2010 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| package zip |
| |
| import ( |
| "bytes" |
| "encoding/binary" |
| "encoding/hex" |
| "io" |
| "io/ioutil" |
| "os" |
| "path/filepath" |
| "regexp" |
| "testing" |
| "time" |
| ) |
| |
| type ZipTest struct { |
| Name string |
| Source func() (r io.ReaderAt, size int64) // if non-nil, used instead of testdata/<Name> file |
| Comment string |
| File []ZipTestFile |
| Error error // the error that Opening this file should return |
| } |
| |
| type ZipTestFile struct { |
| Name string |
| Content []byte // if blank, will attempt to compare against File |
| ContentErr error |
| File string // name of file to compare to (relative to testdata/) |
| Mtime string // modified time in format "mm-dd-yy hh:mm:ss" |
| Mode os.FileMode |
| } |
| |
| // Caution: The Mtime values found for the test files should correspond to |
| // the values listed with unzip -l <zipfile>. However, the values |
| // listed by unzip appear to be off by some hours. When creating |
| // fresh test files and testing them, this issue is not present. |
| // The test files were created in Sydney, so there might be a time |
| // zone issue. The time zone information does have to be encoded |
| // somewhere, because otherwise unzip -l could not provide a different |
| // time from what the archive/zip package provides, but there appears |
| // to be no documentation about this. |
| |
| var tests = []ZipTest{ |
| { |
| Name: "test.zip", |
| Comment: "This is a zipfile comment.", |
| File: []ZipTestFile{ |
| { |
| Name: "test.txt", |
| Content: []byte("This is a test text file.\n"), |
| Mtime: "09-05-10 12:12:02", |
| Mode: 0644, |
| }, |
| { |
| Name: "gophercolor16x16.png", |
| File: "gophercolor16x16.png", |
| Mtime: "09-05-10 15:52:58", |
| Mode: 0644, |
| }, |
| }, |
| }, |
| { |
| Name: "r.zip", |
| Source: returnRecursiveZip, |
| File: []ZipTestFile{ |
| { |
| Name: "r/r.zip", |
| Content: rZipBytes(), |
| Mtime: "03-04-10 00:24:16", |
| Mode: 0666, |
| }, |
| }, |
| }, |
| { |
| Name: "symlink.zip", |
| File: []ZipTestFile{ |
| { |
| Name: "symlink", |
| Content: []byte("../target"), |
| Mode: 0777 | os.ModeSymlink, |
| }, |
| }, |
| }, |
| { |
| Name: "readme.zip", |
| }, |
| { |
| Name: "readme.notzip", |
| Error: ErrFormat, |
| }, |
| { |
| Name: "dd.zip", |
| File: []ZipTestFile{ |
| { |
| Name: "filename", |
| Content: []byte("This is a test textfile.\n"), |
| Mtime: "02-02-11 13:06:20", |
| Mode: 0666, |
| }, |
| }, |
| }, |
| { |
| // created in windows XP file manager. |
| Name: "winxp.zip", |
| File: crossPlatform, |
| }, |
| { |
| // created by Zip 3.0 under Linux |
| Name: "unix.zip", |
| File: crossPlatform, |
| }, |
| { |
| // created by Go, before we wrote the "optional" data |
| // descriptor signatures (which are required by OS X) |
| Name: "go-no-datadesc-sig.zip", |
| File: []ZipTestFile{ |
| { |
| Name: "foo.txt", |
| Content: []byte("foo\n"), |
| Mtime: "03-08-12 16:59:10", |
| Mode: 0644, |
| }, |
| { |
| Name: "bar.txt", |
| Content: []byte("bar\n"), |
| Mtime: "03-08-12 16:59:12", |
| Mode: 0644, |
| }, |
| }, |
| }, |
| { |
| // created by Go, after we wrote the "optional" data |
| // descriptor signatures (which are required by OS X) |
| Name: "go-with-datadesc-sig.zip", |
| File: []ZipTestFile{ |
| { |
| Name: "foo.txt", |
| Content: []byte("foo\n"), |
| Mode: 0666, |
| }, |
| { |
| Name: "bar.txt", |
| Content: []byte("bar\n"), |
| Mode: 0666, |
| }, |
| }, |
| }, |
| { |
| Name: "Bad-CRC32-in-data-descriptor", |
| Source: returnCorruptCRC32Zip, |
| File: []ZipTestFile{ |
| { |
| Name: "foo.txt", |
| Content: []byte("foo\n"), |
| Mode: 0666, |
| ContentErr: ErrChecksum, |
| }, |
| { |
| Name: "bar.txt", |
| Content: []byte("bar\n"), |
| Mode: 0666, |
| }, |
| }, |
| }, |
| // Tests that we verify (and accept valid) crc32s on files |
| // with crc32s in their file header (not in data descriptors) |
| { |
| Name: "crc32-not-streamed.zip", |
| File: []ZipTestFile{ |
| { |
| Name: "foo.txt", |
| Content: []byte("foo\n"), |
| Mtime: "03-08-12 16:59:10", |
| Mode: 0644, |
| }, |
| { |
| Name: "bar.txt", |
| Content: []byte("bar\n"), |
| Mtime: "03-08-12 16:59:12", |
| Mode: 0644, |
| }, |
| }, |
| }, |
| // Tests that we verify (and reject invalid) crc32s on files |
| // with crc32s in their file header (not in data descriptors) |
| { |
| Name: "crc32-not-streamed.zip", |
| Source: returnCorruptNotStreamedZip, |
| File: []ZipTestFile{ |
| { |
| Name: "foo.txt", |
| Content: []byte("foo\n"), |
| Mtime: "03-08-12 16:59:10", |
| Mode: 0644, |
| ContentErr: ErrChecksum, |
| }, |
| { |
| Name: "bar.txt", |
| Content: []byte("bar\n"), |
| Mtime: "03-08-12 16:59:12", |
| Mode: 0644, |
| }, |
| }, |
| }, |
| { |
| Name: "zip64.zip", |
| File: []ZipTestFile{ |
| { |
| Name: "README", |
| Content: []byte("This small file is in ZIP64 format.\n"), |
| Mtime: "08-10-12 14:33:32", |
| Mode: 0644, |
| }, |
| }, |
| }, |
| } |
| |
| var crossPlatform = []ZipTestFile{ |
| { |
| Name: "hello", |
| Content: []byte("world \r\n"), |
| Mode: 0666, |
| }, |
| { |
| Name: "dir/bar", |
| Content: []byte("foo \r\n"), |
| Mode: 0666, |
| }, |
| { |
| Name: "dir/empty/", |
| Content: []byte{}, |
| Mode: os.ModeDir | 0777, |
| }, |
| { |
| Name: "readonly", |
| Content: []byte("important \r\n"), |
| Mode: 0444, |
| }, |
| } |
| |
| func TestReader(t *testing.T) { |
| for _, zt := range tests { |
| readTestZip(t, zt) |
| } |
| } |
| |
| func readTestZip(t *testing.T, zt ZipTest) { |
| var z *Reader |
| var err error |
| if zt.Source != nil { |
| rat, size := zt.Source() |
| z, err = NewReader(rat, size) |
| } else { |
| var rc *ReadCloser |
| rc, err = OpenReader(filepath.Join("testdata", zt.Name)) |
| if err == nil { |
| z = &rc.Reader |
| } |
| } |
| if err != zt.Error { |
| t.Errorf("error=%v, want %v", err, zt.Error) |
| return |
| } |
| |
| // bail if file is not zip |
| if err == ErrFormat { |
| return |
| } |
| |
| // bail here if no Files expected to be tested |
| // (there may actually be files in the zip, but we don't care) |
| if zt.File == nil { |
| return |
| } |
| |
| if z.Comment != zt.Comment { |
| t.Errorf("%s: comment=%q, want %q", zt.Name, z.Comment, zt.Comment) |
| } |
| if len(z.File) != len(zt.File) { |
| t.Fatalf("%s: file count=%d, want %d", zt.Name, len(z.File), len(zt.File)) |
| } |
| |
| // test read of each file |
| for i, ft := range zt.File { |
| readTestFile(t, zt, ft, z.File[i]) |
| } |
| |
| // test simultaneous reads |
| n := 0 |
| done := make(chan bool) |
| for i := 0; i < 5; i++ { |
| for j, ft := range zt.File { |
| go func(j int, ft ZipTestFile) { |
| readTestFile(t, zt, ft, z.File[j]) |
| done <- true |
| }(j, ft) |
| n++ |
| } |
| } |
| for ; n > 0; n-- { |
| <-done |
| } |
| } |
| |
| func readTestFile(t *testing.T, zt ZipTest, ft ZipTestFile, f *File) { |
| if f.Name != ft.Name { |
| t.Errorf("%s: name=%q, want %q", zt.Name, f.Name, ft.Name) |
| } |
| |
| if ft.Mtime != "" { |
| mtime, err := time.Parse("01-02-06 15:04:05", ft.Mtime) |
| if err != nil { |
| t.Error(err) |
| return |
| } |
| if ft := f.ModTime(); !ft.Equal(mtime) { |
| t.Errorf("%s: %s: mtime=%s, want %s", zt.Name, f.Name, ft, mtime) |
| } |
| } |
| |
| testFileMode(t, zt.Name, f, ft.Mode) |
| |
| size0 := f.UncompressedSize |
| |
| var b bytes.Buffer |
| r, err := f.Open() |
| if err != nil { |
| t.Error(err) |
| return |
| } |
| |
| if size1 := f.UncompressedSize; size0 != size1 { |
| t.Errorf("file %q changed f.UncompressedSize from %d to %d", f.Name, size0, size1) |
| } |
| |
| _, err = io.Copy(&b, r) |
| if err != ft.ContentErr { |
| t.Errorf("%s: copying contents: %v (want %v)", zt.Name, err, ft.ContentErr) |
| } |
| if err != nil { |
| return |
| } |
| r.Close() |
| |
| var c []byte |
| if ft.Content != nil { |
| c = ft.Content |
| } else if c, err = ioutil.ReadFile("testdata/" + ft.File); err != nil { |
| t.Error(err) |
| return |
| } |
| |
| if b.Len() != len(c) { |
| t.Errorf("%s: len=%d, want %d", f.Name, b.Len(), len(c)) |
| return |
| } |
| |
| for i, b := range b.Bytes() { |
| if b != c[i] { |
| t.Errorf("%s: content[%d]=%q want %q", f.Name, i, b, c[i]) |
| return |
| } |
| } |
| } |
| |
| func testFileMode(t *testing.T, zipName string, f *File, want os.FileMode) { |
| mode := f.Mode() |
| if want == 0 { |
| t.Errorf("%s: %s mode: got %v, want none", zipName, f.Name, mode) |
| } else if mode != want { |
| t.Errorf("%s: %s mode: want %v, got %v", zipName, f.Name, want, mode) |
| } |
| } |
| |
| func TestInvalidFiles(t *testing.T) { |
| const size = 1024 * 70 // 70kb |
| b := make([]byte, size) |
| |
| // zeroes |
| _, err := NewReader(bytes.NewReader(b), size) |
| if err != ErrFormat { |
| t.Errorf("zeroes: error=%v, want %v", err, ErrFormat) |
| } |
| |
| // repeated directoryEndSignatures |
| sig := make([]byte, 4) |
| binary.LittleEndian.PutUint32(sig, directoryEndSignature) |
| for i := 0; i < size-4; i += 4 { |
| copy(b[i:i+4], sig) |
| } |
| _, err = NewReader(bytes.NewReader(b), size) |
| if err != ErrFormat { |
| t.Errorf("sigs: error=%v, want %v", err, ErrFormat) |
| } |
| } |
| |
| func messWith(fileName string, corrupter func(b []byte)) (r io.ReaderAt, size int64) { |
| data, err := ioutil.ReadFile(filepath.Join("testdata", fileName)) |
| if err != nil { |
| panic("Error reading " + fileName + ": " + err.Error()) |
| } |
| corrupter(data) |
| return bytes.NewReader(data), int64(len(data)) |
| } |
| |
| func returnCorruptCRC32Zip() (r io.ReaderAt, size int64) { |
| return messWith("go-with-datadesc-sig.zip", func(b []byte) { |
| // Corrupt one of the CRC32s in the data descriptor: |
| b[0x2d]++ |
| }) |
| } |
| |
| func returnCorruptNotStreamedZip() (r io.ReaderAt, size int64) { |
| return messWith("crc32-not-streamed.zip", func(b []byte) { |
| // Corrupt foo.txt's final crc32 byte, in both |
| // the file header and TOC. (0x7e -> 0x7f) |
| b[0x11]++ |
| b[0x9d]++ |
| |
| // TODO(bradfitz): add a new test that only corrupts |
| // one of these values, and verify that that's also an |
| // error. Currently, the reader code doesn't verify the |
| // fileheader and TOC's crc32 match if they're both |
| // non-zero and only the second line above, the TOC, |
| // is what matters. |
| }) |
| } |
| |
| // rZipBytes returns the bytes of a recursive zip file, without |
| // putting it on disk and triggering certain virus scanners. |
| func rZipBytes() []byte { |
| s := ` |
| 0000000 50 4b 03 04 14 00 00 00 08 00 08 03 64 3c f9 f4 |
| 0000010 89 64 48 01 00 00 b8 01 00 00 07 00 00 00 72 2f |
| 0000020 72 2e 7a 69 70 00 25 00 da ff 50 4b 03 04 14 00 |
| 0000030 00 00 08 00 08 03 64 3c f9 f4 89 64 48 01 00 00 |
| 0000040 b8 01 00 00 07 00 00 00 72 2f 72 2e 7a 69 70 00 |
| 0000050 2f 00 d0 ff 00 25 00 da ff 50 4b 03 04 14 00 00 |
| 0000060 00 08 00 08 03 64 3c f9 f4 89 64 48 01 00 00 b8 |
| 0000070 01 00 00 07 00 00 00 72 2f 72 2e 7a 69 70 00 2f |
| 0000080 00 d0 ff c2 54 8e 57 39 00 05 00 fa ff c2 54 8e |
| 0000090 57 39 00 05 00 fa ff 00 05 00 fa ff 00 14 00 eb |
| 00000a0 ff c2 54 8e 57 39 00 05 00 fa ff 00 05 00 fa ff |
| 00000b0 00 14 00 eb ff 42 88 21 c4 00 00 14 00 eb ff 42 |
| 00000c0 88 21 c4 00 00 14 00 eb ff 42 88 21 c4 00 00 14 |
| 00000d0 00 eb ff 42 88 21 c4 00 00 14 00 eb ff 42 88 21 |
| 00000e0 c4 00 00 00 00 ff ff 00 00 00 ff ff 00 34 00 cb |
| 00000f0 ff 42 88 21 c4 00 00 00 00 ff ff 00 00 00 ff ff |
| 0000100 00 34 00 cb ff 42 e8 21 5e 0f 00 00 00 ff ff 0a |
| 0000110 f0 66 64 12 61 c0 15 dc e8 a0 48 bf 48 af 2a b3 |
| 0000120 20 c0 9b 95 0d c4 67 04 42 53 06 06 06 40 00 06 |
| 0000130 00 f9 ff 6d 01 00 00 00 00 42 e8 21 5e 0f 00 00 |
| 0000140 00 ff ff 0a f0 66 64 12 61 c0 15 dc e8 a0 48 bf |
| 0000150 48 af 2a b3 20 c0 9b 95 0d c4 67 04 42 53 06 06 |
| 0000160 06 40 00 06 00 f9 ff 6d 01 00 00 00 00 50 4b 01 |
| 0000170 02 14 00 14 00 00 00 08 00 08 03 64 3c f9 f4 89 |
| 0000180 64 48 01 00 00 b8 01 00 00 07 00 00 00 00 00 00 |
| 0000190 00 00 00 00 00 00 00 00 00 00 00 72 2f 72 2e 7a |
| 00001a0 69 70 50 4b 05 06 00 00 00 00 01 00 01 00 35 00 |
| 00001b0 00 00 6d 01 00 00 00 00` |
| s = regexp.MustCompile(`[0-9a-f]{7}`).ReplaceAllString(s, "") |
| s = regexp.MustCompile(`\s+`).ReplaceAllString(s, "") |
| b, err := hex.DecodeString(s) |
| if err != nil { |
| panic(err) |
| } |
| return b |
| } |
| |
| func returnRecursiveZip() (r io.ReaderAt, size int64) { |
| b := rZipBytes() |
| return bytes.NewReader(b), int64(len(b)) |
| } |