blob: 7eebf06ed8ae9184ecc41f85fee2dad8985d3611 [file] [log] [blame]
// Copyright 2015 Google Inc. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
14
Jeff Gaston11b5c512017-10-12 12:19:14 -070015package zip
Colin Cross2fe66872015-03-30 17:20:39 -070016
17import (
Dan Willemsen017d8932016-08-04 15:43:03 -070018 "bytes"
19 "compress/flate"
Jeff Gastona2976952017-08-22 17:51:25 -070020 "errors"
Colin Cross2fe66872015-03-30 17:20:39 -070021 "fmt"
Dan Willemsen017d8932016-08-04 15:43:03 -070022 "hash/crc32"
Colin Cross2fe66872015-03-30 17:20:39 -070023 "io"
24 "io/ioutil"
25 "os"
26 "path/filepath"
Jeff Gastona2976952017-08-22 17:51:25 -070027 "sort"
Colin Cross2fe66872015-03-30 17:20:39 -070028 "strings"
Dan Willemsen017d8932016-08-04 15:43:03 -070029 "sync"
Colin Cross1d98ee22018-09-18 17:05:15 -070030 "syscall"
Colin Cross2fe66872015-03-30 17:20:39 -070031 "time"
Nan Zhang674dd932018-01-26 18:30:36 -080032 "unicode"
Dan Willemsen017d8932016-08-04 15:43:03 -070033
Colin Crossf83c1502017-11-10 13:11:02 -080034 "github.com/google/blueprint/pathtools"
35
Jeff Gastona2976952017-08-22 17:51:25 -070036 "android/soong/jar"
Dan Willemsen017d8932016-08-04 15:43:03 -070037 "android/soong/third_party/zip"
Colin Cross2fe66872015-03-30 17:20:39 -070038)
39
// Sizes that drive parallel compression.
const (
	// parallelBlockSize is the size of each chunk that is compressed
	// independently when a single file is compressed in parallel (1MB).
	parallelBlockSize = 1 << 20

	// minParallelFileSize is the smallest file size for which parallel
	// compression is used. Parallel compression requires more flate.Writer
	// allocations, since the dictionary cannot be changed during Reset.
	minParallelFileSize = 6 * parallelBlockSize

	// windowSize is the size of the ZIP compression window (32KB).
	windowSize = 32 << 10
)
50
// nopCloser wraps an io.Writer and adds a Close method that does nothing, so
// the wrapped writer can be used where an io.WriteCloser is expected.
type nopCloser struct {
	io.Writer
}

// Close always reports success and does not touch the wrapped writer.
func (nopCloser) Close() error { return nil }
58
// byteReaderCloser pairs an in-memory *bytes.Reader with an io.Closer so that
// buffered contents can be handed to code that expects a closable reader.
type byteReaderCloser struct {
	*bytes.Reader
	io.Closer
}
63
// pathMapping records one entry to be added to the zip: the path it will have
// inside the archive (dest), the path it is read from (src), and the zip
// method to use for it.
type pathMapping struct {
	dest, src string
	zipMethod uint16
}
68
// FileArg describes one group of inputs for the zip together with the rules
// used to derive their paths inside the archive.
type FileArg struct {
	// PathPrefixInZip is joined in front of every destination path.
	// SourcePrefixToStrip is the root that source paths are made relative to
	// when JunkPaths is false.
	PathPrefixInZip, SourcePrefixToStrip string
	// SourceFiles lists source paths (glob patterns are expanded by ZipTo).
	SourceFiles []string
	// JunkPaths keeps only the base name of each source path.
	JunkPaths bool
	// GlobDir, when non-empty, names a directory whose whole tree is added.
	GlobDir string
}
75
Colin Crossfe945b42018-09-27 15:00:07 -070076type FileArgsBuilder struct {
77 state FileArg
78 err error
79 fs pathtools.FileSystem
80
81 fileArgs []FileArg
82}
83
84func NewFileArgsBuilder() *FileArgsBuilder {
85 return &FileArgsBuilder{
86 fs: pathtools.OsFs,
87 }
88}
89
90func (b *FileArgsBuilder) JunkPaths(v bool) *FileArgsBuilder {
91 b.state.JunkPaths = v
92 b.state.SourcePrefixToStrip = ""
93 return b
94}
95
96func (b *FileArgsBuilder) SourcePrefixToStrip(prefixToStrip string) *FileArgsBuilder {
97 b.state.JunkPaths = false
98 b.state.SourcePrefixToStrip = prefixToStrip
99 return b
100}
101
102func (b *FileArgsBuilder) PathPrefixInZip(rootPrefix string) *FileArgsBuilder {
103 b.state.PathPrefixInZip = rootPrefix
104 return b
105}
106
107func (b *FileArgsBuilder) File(name string) *FileArgsBuilder {
108 if b.err != nil {
109 return b
110 }
111
112 arg := b.state
113 arg.SourceFiles = []string{name}
114 b.fileArgs = append(b.fileArgs, arg)
115 return b
116}
117
118func (b *FileArgsBuilder) Dir(name string) *FileArgsBuilder {
119 if b.err != nil {
120 return b
121 }
122
123 arg := b.state
124 arg.GlobDir = name
125 b.fileArgs = append(b.fileArgs, arg)
126 return b
127}
128
129func (b *FileArgsBuilder) List(name string) *FileArgsBuilder {
130 if b.err != nil {
131 return b
132 }
133
134 f, err := b.fs.Open(name)
135 if err != nil {
136 b.err = err
137 return b
138 }
139 defer f.Close()
140
141 list, err := ioutil.ReadAll(f)
142 if err != nil {
143 b.err = err
144 return b
145 }
146
147 arg := b.state
148 arg.SourceFiles = strings.Split(string(list), "\n")
149 b.fileArgs = append(b.fileArgs, arg)
150 return b
151}
152
153func (b *FileArgsBuilder) Error() error {
154 if b == nil {
155 return nil
156 }
157 return b.err
158}
159
160func (b *FileArgsBuilder) FileArgs() []FileArg {
161 if b == nil {
162 return nil
163 }
164 return b.fileArgs
165}
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700166
// IncorrectRelativeRootError reports that Path does not lie underneath
// RelativeRoot.
type IncorrectRelativeRootError struct {
	RelativeRoot string
	Path         string
}

// Error implements the error interface.
func (x IncorrectRelativeRootError) Error() string {
	const format = "path %q is outside relative root %q"
	return fmt.Sprintf(format, x.Path, x.RelativeRoot)
}
175
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700176type ZipWriter struct {
Colin Crosse5580972017-08-30 17:40:21 -0700177 time time.Time
178 createdFiles map[string]string
179 createdDirs map[string]string
180 directories bool
Colin Crosse19c7932015-04-24 15:08:38 -0700181
Dan Willemsen017d8932016-08-04 15:43:03 -0700182 errors chan error
183 writeOps chan chan *zipEntry
184
Jeff Gaston175f34c2017-08-17 21:43:21 -0700185 cpuRateLimiter *CPURateLimiter
186 memoryRateLimiter *MemoryRateLimiter
Dan Willemsen017d8932016-08-04 15:43:03 -0700187
188 compressorPool sync.Pool
189 compLevel int
Colin Cross05518bc2018-09-27 15:06:19 -0700190
191 fs pathtools.FileSystem
Dan Willemsen017d8932016-08-04 15:43:03 -0700192}
193
194type zipEntry struct {
195 fh *zip.FileHeader
196
197 // List of delayed io.Reader
198 futureReaders chan chan io.Reader
Jeff Gaston175f34c2017-08-17 21:43:21 -0700199
200 // Only used for passing into the MemoryRateLimiter to ensure we
201 // release as much memory as much as we request
202 allocatedSize int64
Colin Cross2fe66872015-03-30 17:20:39 -0700203}
204
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700205type ZipArgs struct {
Colin Crossfe945b42018-09-27 15:00:07 -0700206 FileArgs []FileArg
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700207 OutputFilePath string
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700208 EmulateJar bool
209 AddDirectoryEntriesToZip bool
210 CompressionLevel int
211 ManifestSourcePath string
212 NumParallelJobs int
213 NonDeflatedFiles map[string]bool
Colin Crossf83c1502017-11-10 13:11:02 -0800214 WriteIfChanged bool
Colin Cross05518bc2018-09-27 15:06:19 -0700215 Filesystem pathtools.FileSystem
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700216}
Colin Cross2fe66872015-03-30 17:20:39 -0700217
// NOQUOTE is the quote state used by ReadRespFile while it is not inside a
// quoted section.
const NOQUOTE = '\x00'

// ReadRespFile splits the contents of a response file into arguments.
//
// Arguments are separated by whitespace that is outside quotes. Single and
// double quotes group characters and are removed from the result. Outside
// single quotes a backslash escapes the following character; inside double
// quotes the backslash itself is kept unless it precedes '"' or '\\'. Empty
// arguments are never produced.
func ReadRespFile(bytes []byte) []string {
	var (
		result  []string
		current []rune
		escaped bool
	)
	quote := NOQUOTE

	for _, r := range string(bytes) {
		if escaped {
			// Under double quoting only '\"' and '\\' are escapes; any other
			// sequence keeps its backslash.
			if quote == '"' && r != '"' && r != '\\' {
				current = append(current, '\\')
			}
			current = append(current, r)
			escaped = false
			continue
		}

		if r == '\\' && quote != '\'' {
			escaped = true
			continue
		}

		if quote == NOQUOTE {
			if r == '\'' || r == '"' {
				quote = r
				continue
			}
			if unicode.IsSpace(r) {
				// Whitespace outside quotes ends the current argument.
				if len(current) > 0 {
					result = append(result, string(current))
				}
				current = current[:0]
				continue
			}
		} else if r == quote {
			quote = NOQUOTE
			continue
		}

		current = append(current, r)
	}

	if len(current) > 0 {
		result = append(result, string(current))
	}

	return result
}
260
Colin Cross05518bc2018-09-27 15:06:19 -0700261func ZipTo(args ZipArgs, w io.Writer) error {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700262 if args.EmulateJar {
263 args.AddDirectoryEntriesToZip = true
Jeff Gaston8edbb3a2017-08-22 20:05:28 -0700264 }
265
Colin Cross05518bc2018-09-27 15:06:19 -0700266 z := &ZipWriter{
Colin Crossc7feeff2018-09-26 21:36:44 +0000267 time: jar.DefaultTime,
268 createdDirs: make(map[string]string),
269 createdFiles: make(map[string]string),
270 directories: args.AddDirectoryEntriesToZip,
271 compLevel: args.CompressionLevel,
Colin Cross05518bc2018-09-27 15:06:19 -0700272 fs: args.Filesystem,
Colin Cross2fe66872015-03-30 17:20:39 -0700273 }
Colin Cross05518bc2018-09-27 15:06:19 -0700274
275 if z.fs == nil {
276 z.fs = pathtools.OsFs
277 }
278
Nan Zhang9067b042017-03-17 14:04:43 -0700279 pathMappings := []pathMapping{}
Nan Zhang9067b042017-03-17 14:04:43 -0700280
Colin Crossd3216292018-09-14 15:06:31 -0700281 noCompression := args.CompressionLevel == 0
282
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700283 for _, fa := range args.FileArgs {
Colin Cross1d98ee22018-09-18 17:05:15 -0700284 var srcs []string
285 for _, s := range fa.SourceFiles {
286 s = strings.TrimSpace(s)
287 if s == "" {
288 continue
289 }
290
291 globbed, _, err := z.fs.Glob(s, nil, pathtools.DontFollowSymlinks)
292 if err != nil {
293 return err
294 }
295 if len(globbed) == 0 {
296 return &os.PathError{
297 Op: "stat",
298 Path: s,
299 Err: os.ErrNotExist,
300 }
301 }
302 srcs = append(srcs, globbed...)
303 }
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700304 if fa.GlobDir != "" {
Colin Cross1d98ee22018-09-18 17:05:15 -0700305 if exists, isDir, err := z.fs.Exists(fa.GlobDir); err != nil {
306 return err
307 } else if !exists {
308 return &os.PathError{
309 Op: "stat",
310 Path: fa.GlobDir,
311 Err: os.ErrNotExist,
312 }
313 } else if !isDir {
314 return &os.PathError{
315 Op: "stat",
316 Path: fa.GlobDir,
317 Err: syscall.ENOTDIR,
318 }
319 }
320 globbed, _, err := z.fs.Glob(filepath.Join(fa.GlobDir, "**/*"), nil, pathtools.DontFollowSymlinks)
321 if err != nil {
322 return err
323 }
324 srcs = append(srcs, globbed...)
Colin Cross7b10cf12017-08-30 14:12:21 -0700325 }
326 for _, src := range srcs {
Colin Crossb7c69112018-09-18 16:51:43 -0700327 err := fillPathPairs(fa, src, &pathMappings, args.NonDeflatedFiles, noCompression)
Colin Crossd3216292018-09-14 15:06:31 -0700328 if err != nil {
Colin Cross05518bc2018-09-27 15:06:19 -0700329 return err
Nan Zhang9067b042017-03-17 14:04:43 -0700330 }
331 }
332 }
333
Colin Cross05518bc2018-09-27 15:06:19 -0700334 return z.write(w, pathMappings, args.ManifestSourcePath, args.EmulateJar, args.NumParallelJobs)
335}
336
337func Zip(args ZipArgs) error {
338 if args.OutputFilePath == "" {
339 return fmt.Errorf("output file path must be nonempty")
340 }
341
Colin Crossf83c1502017-11-10 13:11:02 -0800342 buf := &bytes.Buffer{}
343 var out io.Writer = buf
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700344
Colin Crossf83c1502017-11-10 13:11:02 -0800345 if !args.WriteIfChanged {
346 f, err := os.Create(args.OutputFilePath)
347 if err != nil {
348 return err
349 }
350
351 defer f.Close()
352 defer func() {
353 if err != nil {
354 os.Remove(args.OutputFilePath)
355 }
356 }()
357
358 out = f
359 }
360
Colin Cross05518bc2018-09-27 15:06:19 -0700361 err := ZipTo(args, out)
Colin Crossf83c1502017-11-10 13:11:02 -0800362 if err != nil {
363 return err
364 }
365
366 if args.WriteIfChanged {
367 err := pathtools.WriteFileIfChanged(args.OutputFilePath, buf.Bytes(), 0666)
368 if err != nil {
369 return err
370 }
371 }
372
373 return nil
Colin Cross2fe66872015-03-30 17:20:39 -0700374}
375
Colin Crossb7c69112018-09-18 16:51:43 -0700376func fillPathPairs(fa FileArg, src string, pathMappings *[]pathMapping,
Colin Crossd3216292018-09-14 15:06:31 -0700377 nonDeflatedFiles map[string]bool, noCompression bool) error {
378
Colin Crossb7c69112018-09-18 16:51:43 -0700379 var dest string
380
381 if fa.JunkPaths {
382 dest = filepath.Base(src)
383 } else {
384 var err error
385 dest, err = filepath.Rel(fa.SourcePrefixToStrip, src)
386 if err != nil {
387 return err
388 }
Colin Cross1d98ee22018-09-18 17:05:15 -0700389 if strings.HasPrefix(dest, "../") {
390 return IncorrectRelativeRootError{
391 Path: src,
392 RelativeRoot: fa.SourcePrefixToStrip,
393 }
394 }
395
Nan Zhang9067b042017-03-17 14:04:43 -0700396 }
Colin Crossb7c69112018-09-18 16:51:43 -0700397 dest = filepath.Join(fa.PathPrefixInZip, dest)
Nan Zhang9067b042017-03-17 14:04:43 -0700398
Nan Zhangf281bd82017-04-25 16:47:45 -0700399 zipMethod := zip.Deflate
Colin Crossd3216292018-09-14 15:06:31 -0700400 if _, found := nonDeflatedFiles[dest]; found || noCompression {
Nan Zhangf281bd82017-04-25 16:47:45 -0700401 zipMethod = zip.Store
402 }
403 *pathMappings = append(*pathMappings,
404 pathMapping{dest: dest, src: src, zipMethod: zipMethod})
Nan Zhang9067b042017-03-17 14:04:43 -0700405
406 return nil
407}
408
Jeff Gastona2976952017-08-22 17:51:25 -0700409func jarSort(mappings []pathMapping) {
410 less := func(i int, j int) (smaller bool) {
411 return jar.EntryNamesLess(mappings[i].dest, mappings[j].dest)
412 }
413 sort.SliceStable(mappings, less)
414}
415
Colin Crossf83c1502017-11-10 13:11:02 -0800416func (z *ZipWriter) write(f io.Writer, pathMappings []pathMapping, manifest string, emulateJar bool, parallelJobs int) error {
Dan Willemsen017d8932016-08-04 15:43:03 -0700417 z.errors = make(chan error)
418 defer close(z.errors)
Colin Cross2fe66872015-03-30 17:20:39 -0700419
Dan Willemsen017d8932016-08-04 15:43:03 -0700420 // This channel size can be essentially unlimited -- it's used as a fifo
421 // queue decouple the CPU and IO loads. Directories don't require any
422 // compression time, but still cost some IO. Similar with small files that
423 // can be very fast to compress. Some files that are more difficult to
424 // compress won't take a corresponding longer time writing out.
425 //
426 // The optimum size here depends on your CPU and IO characteristics, and
427 // the the layout of your zip file. 1000 was chosen mostly at random as
428 // something that worked reasonably well for a test file.
429 //
430 // The RateLimit object will put the upper bounds on the number of
431 // parallel compressions and outstanding buffers.
432 z.writeOps = make(chan chan *zipEntry, 1000)
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700433 z.cpuRateLimiter = NewCPURateLimiter(int64(parallelJobs))
Jeff Gaston175f34c2017-08-17 21:43:21 -0700434 z.memoryRateLimiter = NewMemoryRateLimiter(0)
435 defer func() {
436 z.cpuRateLimiter.Stop()
437 z.memoryRateLimiter.Stop()
438 }()
Jeff Gastona2976952017-08-22 17:51:25 -0700439
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700440 if manifest != "" && !emulateJar {
Colin Cross635acc92017-09-12 22:50:46 -0700441 return errors.New("must specify --jar when specifying a manifest via -m")
Jeff Gastona2976952017-08-22 17:51:25 -0700442 }
443
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700444 if emulateJar {
Colin Cross635acc92017-09-12 22:50:46 -0700445 // manifest may be empty, in which case addManifest will fill in a default
446 pathMappings = append(pathMappings, pathMapping{jar.ManifestFile, manifest, zip.Deflate})
447
Jeff Gastona2976952017-08-22 17:51:25 -0700448 jarSort(pathMappings)
449 }
450
Dan Willemsen017d8932016-08-04 15:43:03 -0700451 go func() {
452 var err error
453 defer close(z.writeOps)
454
Nan Zhang9067b042017-03-17 14:04:43 -0700455 for _, ele := range pathMappings {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700456 if emulateJar && ele.dest == jar.ManifestFile {
Jeff Gastoncef50b92017-08-23 15:41:35 -0700457 err = z.addManifest(ele.dest, ele.src, ele.zipMethod)
458 } else {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700459 err = z.addFile(ele.dest, ele.src, ele.zipMethod, emulateJar)
Jeff Gastoncef50b92017-08-23 15:41:35 -0700460 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700461 if err != nil {
462 z.errors <- err
463 return
464 }
465 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700466 }()
467
468 zipw := zip.NewWriter(f)
469
470 var currentWriteOpChan chan *zipEntry
471 var currentWriter io.WriteCloser
472 var currentReaders chan chan io.Reader
473 var currentReader chan io.Reader
474 var done bool
475
476 for !done {
477 var writeOpsChan chan chan *zipEntry
478 var writeOpChan chan *zipEntry
479 var readersChan chan chan io.Reader
480
481 if currentReader != nil {
482 // Only read and process errors
483 } else if currentReaders != nil {
484 readersChan = currentReaders
485 } else if currentWriteOpChan != nil {
486 writeOpChan = currentWriteOpChan
487 } else {
488 writeOpsChan = z.writeOps
489 }
490
491 select {
492 case writeOp, ok := <-writeOpsChan:
493 if !ok {
494 done = true
495 }
496
497 currentWriteOpChan = writeOp
498
499 case op := <-writeOpChan:
500 currentWriteOpChan = nil
501
Colin Crossf83c1502017-11-10 13:11:02 -0800502 var err error
Dan Willemsen017d8932016-08-04 15:43:03 -0700503 if op.fh.Method == zip.Deflate {
504 currentWriter, err = zipw.CreateCompressedHeader(op.fh)
505 } else {
506 var zw io.Writer
Jeff Gastonc5eb66d2017-08-24 14:11:27 -0700507
508 op.fh.CompressedSize64 = op.fh.UncompressedSize64
509
510 zw, err = zipw.CreateHeaderAndroid(op.fh)
Dan Willemsen017d8932016-08-04 15:43:03 -0700511 currentWriter = nopCloser{zw}
512 }
513 if err != nil {
514 return err
515 }
516
517 currentReaders = op.futureReaders
518 if op.futureReaders == nil {
519 currentWriter.Close()
520 currentWriter = nil
521 }
Jeff Gaston175f34c2017-08-17 21:43:21 -0700522 z.memoryRateLimiter.Finish(op.allocatedSize)
Dan Willemsen017d8932016-08-04 15:43:03 -0700523
524 case futureReader, ok := <-readersChan:
525 if !ok {
526 // Done with reading
527 currentWriter.Close()
528 currentWriter = nil
529 currentReaders = nil
530 }
531
532 currentReader = futureReader
533
534 case reader := <-currentReader:
Colin Crossf83c1502017-11-10 13:11:02 -0800535 _, err := io.Copy(currentWriter, reader)
Dan Willemsen017d8932016-08-04 15:43:03 -0700536 if err != nil {
537 return err
538 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700539
540 currentReader = nil
541
Colin Crossf83c1502017-11-10 13:11:02 -0800542 case err := <-z.errors:
Colin Cross2fe66872015-03-30 17:20:39 -0700543 return err
544 }
545 }
546
Dan Willemsen017d8932016-08-04 15:43:03 -0700547 // One last chance to catch an error
548 select {
Colin Crossf83c1502017-11-10 13:11:02 -0800549 case err := <-z.errors:
Dan Willemsen017d8932016-08-04 15:43:03 -0700550 return err
551 default:
552 zipw.Close()
553 return nil
Colin Cross2fe66872015-03-30 17:20:39 -0700554 }
Colin Cross2fe66872015-03-30 17:20:39 -0700555}
556
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700557// imports (possibly with compression) <src> into the zip at sub-path <dest>
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700558func (z *ZipWriter) addFile(dest, src string, method uint16, emulateJar bool) error {
Dan Willemsen017d8932016-08-04 15:43:03 -0700559 var fileSize int64
Dan Willemsen10462b32017-03-15 19:02:51 -0700560 var executable bool
Dan Willemsen017d8932016-08-04 15:43:03 -0700561
Colin Cross05518bc2018-09-27 15:06:19 -0700562 if s, err := z.fs.Lstat(src); err != nil {
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700563 return err
564 } else if s.IsDir() {
Colin Cross957cc4e2015-04-24 15:10:32 -0700565 if z.directories {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700566 return z.writeDirectory(dest, src, emulateJar)
Colin Cross957cc4e2015-04-24 15:10:32 -0700567 }
568 return nil
Dan Willemsen017d8932016-08-04 15:43:03 -0700569 } else {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700570 if err := z.writeDirectory(filepath.Dir(dest), src, emulateJar); err != nil {
Colin Crosse5580972017-08-30 17:40:21 -0700571 return err
572 }
573
574 if prev, exists := z.createdDirs[dest]; exists {
575 return fmt.Errorf("destination %q is both a directory %q and a file %q", dest, prev, src)
576 }
577 if prev, exists := z.createdFiles[dest]; exists {
578 return fmt.Errorf("destination %q has two files %q and %q", dest, prev, src)
579 }
580
581 z.createdFiles[dest] = src
582
583 if s.Mode()&os.ModeSymlink != 0 {
584 return z.writeSymlink(dest, src)
585 } else if !s.Mode().IsRegular() {
586 return fmt.Errorf("%s is not a file, directory, or symlink", src)
587 }
588
Dan Willemsen017d8932016-08-04 15:43:03 -0700589 fileSize = s.Size()
Dan Willemsen10462b32017-03-15 19:02:51 -0700590 executable = s.Mode()&0100 != 0
Colin Cross957cc4e2015-04-24 15:10:32 -0700591 }
592
Colin Cross05518bc2018-09-27 15:06:19 -0700593 r, err := z.fs.Open(src)
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700594 if err != nil {
595 return err
596 }
597
598 header := &zip.FileHeader{
599 Name: dest,
600 Method: method,
601 UncompressedSize64: uint64(fileSize),
602 }
603
604 if executable {
605 header.SetMode(0700)
606 }
607
608 return z.writeFileContents(header, r)
609}
610
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700611func (z *ZipWriter) addManifest(dest string, src string, method uint16) error {
Colin Crosse5580972017-08-30 17:40:21 -0700612 if prev, exists := z.createdDirs[dest]; exists {
613 return fmt.Errorf("destination %q is both a directory %q and a file %q", dest, prev, src)
614 }
615 if prev, exists := z.createdFiles[dest]; exists {
616 return fmt.Errorf("destination %q has two files %q and %q", dest, prev, src)
617 }
618
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700619 if err := z.writeDirectory(filepath.Dir(dest), src, true); err != nil {
Colin Cross635acc92017-09-12 22:50:46 -0700620 return err
Jeff Gastoncef50b92017-08-23 15:41:35 -0700621 }
622
Colin Cross05518bc2018-09-27 15:06:19 -0700623 var contents []byte
624 if src != "" {
625 f, err := z.fs.Open(src)
626 if err != nil {
627 return err
628 }
629
630 contents, err = ioutil.ReadAll(f)
631 f.Close()
632 if err != nil {
633 return err
634 }
635 }
636
637 fh, buf, err := jar.ManifestFileContents(contents)
Colin Cross635acc92017-09-12 22:50:46 -0700638 if err != nil {
639 return err
Jeff Gastoncef50b92017-08-23 15:41:35 -0700640 }
641
Colin Cross635acc92017-09-12 22:50:46 -0700642 reader := &byteReaderCloser{bytes.NewReader(buf), ioutil.NopCloser(nil)}
643
644 return z.writeFileContents(fh, reader)
Jeff Gastoncef50b92017-08-23 15:41:35 -0700645}
646
Colin Cross05518bc2018-09-27 15:06:19 -0700647func (z *ZipWriter) writeFileContents(header *zip.FileHeader, r pathtools.ReaderAtSeekerCloser) (err error) {
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700648
649 header.SetModTime(z.time)
650
Dan Willemsen017d8932016-08-04 15:43:03 -0700651 compressChan := make(chan *zipEntry, 1)
652 z.writeOps <- compressChan
653
654 // Pre-fill a zipEntry, it will be sent in the compressChan once
655 // we're sure about the Method and CRC.
656 ze := &zipEntry{
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700657 fh: header,
Dan Willemsen10462b32017-03-15 19:02:51 -0700658 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700659
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700660 ze.allocatedSize = int64(header.UncompressedSize64)
Jeff Gaston175f34c2017-08-17 21:43:21 -0700661 z.cpuRateLimiter.Request()
662 z.memoryRateLimiter.Request(ze.allocatedSize)
Dan Willemsen017d8932016-08-04 15:43:03 -0700663
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700664 fileSize := int64(header.UncompressedSize64)
665 if fileSize == 0 {
666 fileSize = int64(header.UncompressedSize)
667 }
668
669 if header.Method == zip.Deflate && fileSize >= minParallelFileSize {
Dan Willemsen017d8932016-08-04 15:43:03 -0700670 wg := new(sync.WaitGroup)
671
672 // Allocate enough buffer to hold all readers. We'll limit
673 // this based on actual buffer sizes in RateLimit.
674 ze.futureReaders = make(chan chan io.Reader, (fileSize/parallelBlockSize)+1)
675
676 // Calculate the CRC in the background, since reading the entire
677 // file could take a while.
678 //
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700679 // We could split this up into chunks as well, but it's faster
Dan Willemsen017d8932016-08-04 15:43:03 -0700680 // than the compression. Due to the Go Zip API, we also need to
681 // know the result before we can begin writing the compressed
682 // data out to the zipfile.
683 wg.Add(1)
Jeff Gaston175f34c2017-08-17 21:43:21 -0700684 go z.crcFile(r, ze, compressChan, wg)
Dan Willemsen017d8932016-08-04 15:43:03 -0700685
686 for start := int64(0); start < fileSize; start += parallelBlockSize {
687 sr := io.NewSectionReader(r, start, parallelBlockSize)
688 resultChan := make(chan io.Reader, 1)
689 ze.futureReaders <- resultChan
690
Jeff Gaston175f34c2017-08-17 21:43:21 -0700691 z.cpuRateLimiter.Request()
Dan Willemsen017d8932016-08-04 15:43:03 -0700692
693 last := !(start+parallelBlockSize < fileSize)
694 var dict []byte
695 if start >= windowSize {
696 dict, err = ioutil.ReadAll(io.NewSectionReader(r, start-windowSize, windowSize))
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700697 if err != nil {
698 return err
699 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700700 }
701
702 wg.Add(1)
Jeff Gaston175f34c2017-08-17 21:43:21 -0700703 go z.compressPartialFile(sr, dict, last, resultChan, wg)
Dan Willemsen017d8932016-08-04 15:43:03 -0700704 }
705
706 close(ze.futureReaders)
707
708 // Close the file handle after all readers are done
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700709 go func(wg *sync.WaitGroup, closer io.Closer) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700710 wg.Wait()
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700711 closer.Close()
Dan Willemsen017d8932016-08-04 15:43:03 -0700712 }(wg, r)
713 } else {
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700714 go func() {
715 z.compressWholeFile(ze, r, compressChan)
716 r.Close()
717 }()
Dan Willemsen017d8932016-08-04 15:43:03 -0700718 }
719
720 return nil
721}
722
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700723func (z *ZipWriter) crcFile(r io.Reader, ze *zipEntry, resultChan chan *zipEntry, wg *sync.WaitGroup) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700724 defer wg.Done()
Jeff Gaston175f34c2017-08-17 21:43:21 -0700725 defer z.cpuRateLimiter.Finish()
Dan Willemsen017d8932016-08-04 15:43:03 -0700726
727 crc := crc32.NewIEEE()
728 _, err := io.Copy(crc, r)
729 if err != nil {
730 z.errors <- err
731 return
732 }
733
734 ze.fh.CRC32 = crc.Sum32()
735 resultChan <- ze
736 close(resultChan)
737}
738
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700739func (z *ZipWriter) compressPartialFile(r io.Reader, dict []byte, last bool, resultChan chan io.Reader, wg *sync.WaitGroup) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700740 defer wg.Done()
741
742 result, err := z.compressBlock(r, dict, last)
743 if err != nil {
744 z.errors <- err
745 return
746 }
747
Jeff Gaston175f34c2017-08-17 21:43:21 -0700748 z.cpuRateLimiter.Finish()
749
Dan Willemsen017d8932016-08-04 15:43:03 -0700750 resultChan <- result
751}
752
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700753func (z *ZipWriter) compressBlock(r io.Reader, dict []byte, last bool) (*bytes.Buffer, error) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700754 buf := new(bytes.Buffer)
755 var fw *flate.Writer
756 var err error
757 if len(dict) > 0 {
758 // There's no way to Reset a Writer with a new dictionary, so
759 // don't use the Pool
760 fw, err = flate.NewWriterDict(buf, z.compLevel, dict)
761 } else {
762 var ok bool
763 if fw, ok = z.compressorPool.Get().(*flate.Writer); ok {
764 fw.Reset(buf)
765 } else {
766 fw, err = flate.NewWriter(buf, z.compLevel)
767 }
768 defer z.compressorPool.Put(fw)
769 }
770 if err != nil {
771 return nil, err
772 }
773
774 _, err = io.Copy(fw, r)
775 if err != nil {
776 return nil, err
777 }
778 if last {
779 fw.Close()
780 } else {
781 fw.Flush()
782 }
783
784 return buf, nil
785}
786
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700787func (z *ZipWriter) compressWholeFile(ze *zipEntry, r io.ReadSeeker, compressChan chan *zipEntry) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700788
Dan Willemsen017d8932016-08-04 15:43:03 -0700789 crc := crc32.NewIEEE()
Dan Willemsena8b55022017-03-15 21:49:26 -0700790 _, err := io.Copy(crc, r)
Colin Cross2fe66872015-03-30 17:20:39 -0700791 if err != nil {
Dan Willemsen017d8932016-08-04 15:43:03 -0700792 z.errors <- err
793 return
Colin Cross2fe66872015-03-30 17:20:39 -0700794 }
795
Dan Willemsena8b55022017-03-15 21:49:26 -0700796 ze.fh.CRC32 = crc.Sum32()
Colin Cross2fe66872015-03-30 17:20:39 -0700797
Dan Willemsen017d8932016-08-04 15:43:03 -0700798 _, err = r.Seek(0, 0)
Colin Cross2fe66872015-03-30 17:20:39 -0700799 if err != nil {
Dan Willemsen017d8932016-08-04 15:43:03 -0700800 z.errors <- err
801 return
Colin Cross2fe66872015-03-30 17:20:39 -0700802 }
803
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700804 readFile := func(reader io.ReadSeeker) ([]byte, error) {
805 _, err := reader.Seek(0, 0)
Nan Zhangf281bd82017-04-25 16:47:45 -0700806 if err != nil {
807 return nil, err
808 }
809
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700810 buf, err := ioutil.ReadAll(reader)
Nan Zhangf281bd82017-04-25 16:47:45 -0700811 if err != nil {
812 return nil, err
813 }
814
815 return buf, nil
816 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700817
Dan Willemsena8b55022017-03-15 21:49:26 -0700818 ze.futureReaders = make(chan chan io.Reader, 1)
Dan Willemsen017d8932016-08-04 15:43:03 -0700819 futureReader := make(chan io.Reader, 1)
820 ze.futureReaders <- futureReader
821 close(ze.futureReaders)
822
Nan Zhangf281bd82017-04-25 16:47:45 -0700823 if ze.fh.Method == zip.Deflate {
824 compressed, err := z.compressBlock(r, nil, true)
825 if err != nil {
826 z.errors <- err
827 return
828 }
829 if uint64(compressed.Len()) < ze.fh.UncompressedSize64 {
830 futureReader <- compressed
Nan Zhangf281bd82017-04-25 16:47:45 -0700831 } else {
832 buf, err := readFile(r)
833 if err != nil {
834 z.errors <- err
835 return
836 }
837 ze.fh.Method = zip.Store
838 futureReader <- bytes.NewReader(buf)
Nan Zhangf281bd82017-04-25 16:47:45 -0700839 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700840 } else {
Nan Zhangf281bd82017-04-25 16:47:45 -0700841 buf, err := readFile(r)
Dan Willemsen017d8932016-08-04 15:43:03 -0700842 if err != nil {
843 z.errors <- err
844 return
845 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700846 ze.fh.Method = zip.Store
847 futureReader <- bytes.NewReader(buf)
Dan Willemsen017d8932016-08-04 15:43:03 -0700848 }
Nan Zhangf281bd82017-04-25 16:47:45 -0700849
Jeff Gaston175f34c2017-08-17 21:43:21 -0700850 z.cpuRateLimiter.Finish()
851
Dan Willemsen017d8932016-08-04 15:43:03 -0700852 close(futureReader)
853
854 compressChan <- ze
855 close(compressChan)
Colin Cross2fe66872015-03-30 17:20:39 -0700856}
Colin Crosse19c7932015-04-24 15:08:38 -0700857
Colin Crosse5580972017-08-30 17:40:21 -0700858// writeDirectory annotates that dir is a directory created for the src file or directory, and adds
859// the directory entry to the zip file if directories are enabled.
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700860func (z *ZipWriter) writeDirectory(dir string, src string, emulateJar bool) error {
Jeff Gaston2d174132017-08-15 18:05:56 -0700861 // clean the input
Colin Crosse5580972017-08-30 17:40:21 -0700862 dir = filepath.Clean(dir)
Jeff Gaston2d174132017-08-15 18:05:56 -0700863
864 // discover any uncreated directories in the path
865 zipDirs := []string{}
Colin Crosse5580972017-08-30 17:40:21 -0700866 for dir != "" && dir != "." {
867 if _, exists := z.createdDirs[dir]; exists {
868 break
869 }
Jeff Gaston2d174132017-08-15 18:05:56 -0700870
Colin Crosse5580972017-08-30 17:40:21 -0700871 if prev, exists := z.createdFiles[dir]; exists {
872 return fmt.Errorf("destination %q is both a directory %q and a file %q", dir, src, prev)
873 }
874
875 z.createdDirs[dir] = src
Jeff Gaston2d174132017-08-15 18:05:56 -0700876 // parent directories precede their children
Colin Crosse5580972017-08-30 17:40:21 -0700877 zipDirs = append([]string{dir}, zipDirs...)
Jeff Gaston2d174132017-08-15 18:05:56 -0700878
Colin Crosse5580972017-08-30 17:40:21 -0700879 dir = filepath.Dir(dir)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700880 }
881
Colin Crosse5580972017-08-30 17:40:21 -0700882 if z.directories {
883 // make a directory entry for each uncreated directory
884 for _, cleanDir := range zipDirs {
Colin Cross635acc92017-09-12 22:50:46 -0700885 var dirHeader *zip.FileHeader
Colin Crosse19c7932015-04-24 15:08:38 -0700886
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700887 if emulateJar && cleanDir+"/" == jar.MetaDir {
Colin Cross635acc92017-09-12 22:50:46 -0700888 dirHeader = jar.MetaDirFileHeader()
889 } else {
890 dirHeader = &zip.FileHeader{
891 Name: cleanDir + "/",
892 }
893 dirHeader.SetMode(0700 | os.ModeDir)
Colin Crosse5580972017-08-30 17:40:21 -0700894 }
Jeff Gaston8edbb3a2017-08-22 20:05:28 -0700895
Colin Cross635acc92017-09-12 22:50:46 -0700896 dirHeader.SetModTime(z.time)
897
Colin Crosse5580972017-08-30 17:40:21 -0700898 ze := make(chan *zipEntry, 1)
899 ze <- &zipEntry{
900 fh: dirHeader,
901 }
902 close(ze)
903 z.writeOps <- ze
Colin Crosse19c7932015-04-24 15:08:38 -0700904 }
Colin Crosse19c7932015-04-24 15:08:38 -0700905 }
906
907 return nil
908}
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700909
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700910func (z *ZipWriter) writeSymlink(rel, file string) error {
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700911 fileHeader := &zip.FileHeader{
912 Name: rel,
913 }
914 fileHeader.SetModTime(z.time)
Colin Cross297d9bc2018-06-22 16:37:47 -0700915 fileHeader.SetMode(0777 | os.ModeSymlink)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700916
Colin Cross05518bc2018-09-27 15:06:19 -0700917 dest, err := z.fs.Readlink(file)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700918 if err != nil {
919 return err
920 }
921
Colin Cross297d9bc2018-06-22 16:37:47 -0700922 fileHeader.UncompressedSize64 = uint64(len(dest))
923 fileHeader.CRC32 = crc32.ChecksumIEEE([]byte(dest))
924
Dan Willemsen017d8932016-08-04 15:43:03 -0700925 ze := make(chan *zipEntry, 1)
926 futureReaders := make(chan chan io.Reader, 1)
927 futureReader := make(chan io.Reader, 1)
928 futureReaders <- futureReader
929 close(futureReaders)
930 futureReader <- bytes.NewBufferString(dest)
931 close(futureReader)
932
Dan Willemsen017d8932016-08-04 15:43:03 -0700933 ze <- &zipEntry{
934 fh: fileHeader,
935 futureReaders: futureReaders,
936 }
937 close(ze)
938 z.writeOps <- ze
939
940 return nil
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700941}