blob: d8507df2caf4602ee578c96c3812114884cb7fbb [file] [log] [blame]
// Copyright 2015 Google Inc. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
14
Jeff Gaston11b5c512017-10-12 12:19:14 -070015package zip
Colin Cross2fe66872015-03-30 17:20:39 -070016
17import (
Dan Willemsen017d8932016-08-04 15:43:03 -070018 "bytes"
19 "compress/flate"
Jeff Gastona2976952017-08-22 17:51:25 -070020 "errors"
Colin Cross2fe66872015-03-30 17:20:39 -070021 "fmt"
Dan Willemsen017d8932016-08-04 15:43:03 -070022 "hash/crc32"
Colin Cross2fe66872015-03-30 17:20:39 -070023 "io"
24 "io/ioutil"
25 "os"
26 "path/filepath"
Jeff Gastona2976952017-08-22 17:51:25 -070027 "sort"
Colin Cross2fe66872015-03-30 17:20:39 -070028 "strings"
Dan Willemsen017d8932016-08-04 15:43:03 -070029 "sync"
Colin Cross1d98ee22018-09-18 17:05:15 -070030 "syscall"
Colin Cross2fe66872015-03-30 17:20:39 -070031 "time"
Nan Zhang674dd932018-01-26 18:30:36 -080032 "unicode"
Dan Willemsen017d8932016-08-04 15:43:03 -070033
Colin Crossf83c1502017-11-10 13:11:02 -080034 "github.com/google/blueprint/pathtools"
35
Jeff Gastona2976952017-08-22 17:51:25 -070036 "android/soong/jar"
Dan Willemsen017d8932016-08-04 15:43:03 -070037 "android/soong/third_party/zip"
Colin Cross2fe66872015-03-30 17:20:39 -070038)
39
// parallelBlockSize is the size of each chunk that is compressed
// independently when a single file is compressed in parallel.
const parallelBlockSize = 1 * 1024 * 1024 // 1MB

// minParallelFileSize is the smallest file size for which a deflated file is
// split into parallelBlockSize chunks and compressed in parallel. Parallel
// compression requires more flate.Writer allocations, since the dictionary
// cannot be changed during Reset.
const minParallelFileSize = parallelBlockSize * 6

// windowSize is the size of the ZIP compression window (32KB). When a file is
// compressed in chunks, this many bytes preceding a chunk are read back and
// handed to that chunk's compressor as its dictionary.
const windowSize = 32 * 1024
50
// nopCloser wraps an io.Writer and adds a Close method that does nothing, so
// that a plain writer can be used where an io.WriteCloser is expected.
type nopCloser struct {
	io.Writer
}

// Close implements io.Closer. It does nothing and always returns nil; the
// wrapped writer is left untouched.
func (nopCloser) Close() error {
	return nil
}
58
// byteReaderCloser pairs an in-memory *bytes.Reader with an io.Closer so that
// a byte slice can be passed where a closable reader is required. addManifest
// uses it, with a no-op closer, to hand manifest contents to
// writeFileContents.
type byteReaderCloser struct {
	*bytes.Reader
	io.Closer
}
63
// pathMapping describes one entry to be added to the zip file.
type pathMapping struct {
	// dest is the entry's path inside the zip; src is the path it is read from.
	dest, src string
	// zipMethod is the requested compression method (zip.Deflate or zip.Store).
	zipMethod uint16
}
68
// FileArg describes a group of inputs to add to the zip file together with
// the rules used to derive their paths inside the zip.
type FileArg struct {
	// PathPrefixInZip is joined in front of every destination path.
	// SourcePrefixToStrip is the root that source paths are made relative to
	// when JunkPaths is false.
	PathPrefixInZip, SourcePrefixToStrip string
	// SourceFiles lists source paths or glob patterns; entries are trimmed of
	// surrounding whitespace and empty entries are skipped by ZipTo.
	SourceFiles []string
	// JunkPaths, when true, keeps only the base name of each source path.
	JunkPaths bool
	// GlobDir, when non-empty, names a directory whose entire contents
	// (matched with "**/*") are added.
	GlobDir string
}
75
Colin Crossfe945b42018-09-27 15:00:07 -070076type FileArgsBuilder struct {
77 state FileArg
78 err error
79 fs pathtools.FileSystem
80
81 fileArgs []FileArg
82}
83
84func NewFileArgsBuilder() *FileArgsBuilder {
85 return &FileArgsBuilder{
86 fs: pathtools.OsFs,
87 }
88}
89
90func (b *FileArgsBuilder) JunkPaths(v bool) *FileArgsBuilder {
91 b.state.JunkPaths = v
92 b.state.SourcePrefixToStrip = ""
93 return b
94}
95
96func (b *FileArgsBuilder) SourcePrefixToStrip(prefixToStrip string) *FileArgsBuilder {
97 b.state.JunkPaths = false
98 b.state.SourcePrefixToStrip = prefixToStrip
99 return b
100}
101
102func (b *FileArgsBuilder) PathPrefixInZip(rootPrefix string) *FileArgsBuilder {
103 b.state.PathPrefixInZip = rootPrefix
104 return b
105}
106
107func (b *FileArgsBuilder) File(name string) *FileArgsBuilder {
108 if b.err != nil {
109 return b
110 }
111
112 arg := b.state
113 arg.SourceFiles = []string{name}
114 b.fileArgs = append(b.fileArgs, arg)
115 return b
116}
117
118func (b *FileArgsBuilder) Dir(name string) *FileArgsBuilder {
119 if b.err != nil {
120 return b
121 }
122
123 arg := b.state
124 arg.GlobDir = name
125 b.fileArgs = append(b.fileArgs, arg)
126 return b
127}
128
129func (b *FileArgsBuilder) List(name string) *FileArgsBuilder {
130 if b.err != nil {
131 return b
132 }
133
134 f, err := b.fs.Open(name)
135 if err != nil {
136 b.err = err
137 return b
138 }
139 defer f.Close()
140
141 list, err := ioutil.ReadAll(f)
142 if err != nil {
143 b.err = err
144 return b
145 }
146
147 arg := b.state
148 arg.SourceFiles = strings.Split(string(list), "\n")
149 b.fileArgs = append(b.fileArgs, arg)
150 return b
151}
152
153func (b *FileArgsBuilder) Error() error {
154 if b == nil {
155 return nil
156 }
157 return b.err
158}
159
160func (b *FileArgsBuilder) FileArgs() []FileArg {
161 if b == nil {
162 return nil
163 }
164 return b.fileArgs
165}
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700166
// IncorrectRelativeRootError reports that Path does not lie underneath
// RelativeRoot, so no zip-relative name can be derived for it.
type IncorrectRelativeRootError struct {
	RelativeRoot string
	Path         string
}

// Error implements the error interface; both paths are quoted in the message.
func (e IncorrectRelativeRootError) Error() string {
	const format = "path %q is outside relative root %q"
	return fmt.Sprintf(format, e.Path, e.RelativeRoot)
}
175
// ZipWriter holds the state used while producing a single zip file.
type ZipWriter struct {
	// time is the modification time stamped on every entry.
	time time.Time
	// createdFiles maps the zip path of each file entry added so far to the
	// source it came from; it is used to reject duplicate destinations.
	createdFiles map[string]string
	// createdDirs maps the zip path of each directory seen so far to the
	// source that caused it to be created.
	createdDirs map[string]string
	// directories controls whether explicit directory entries are written.
	directories bool

	// errors carries errors from worker goroutines to the write loop.
	errors chan error
	// writeOps is the ordered queue of pending entries. Each element is a
	// channel that later delivers the prepared zipEntry for that slot.
	writeOps chan chan *zipEntry

	// Rate limiters requested before compression work starts and finished
	// when it completes.
	// NOTE(review): their exact limits are defined outside this view.
	cpuRateLimiter    *CPURateLimiter
	memoryRateLimiter *MemoryRateLimiter

	// compressorPool recycles flate.Writers that were created without a
	// dictionary.
	compressorPool sync.Pool
	// compLevel is the flate compression level passed to new flate.Writers.
	compLevel int

	// followSymlinks selects Stat (true) or Lstat (false) when inspecting
	// sources, and is passed to Glob.
	followSymlinks pathtools.ShouldFollowSymlinks

	// fs is the filesystem sources are read from.
	fs pathtools.FileSystem
}
195
// zipEntry is one fully described entry handed to the write loop: its header
// plus, optionally, the readers that will produce its contents.
type zipEntry struct {
	fh *zip.FileHeader

	// List of delayed io.Reader. Each inner channel delivers one reader; the
	// readers are copied to the zip in order. A nil channel means the entry
	// has no contents (for example a directory).
	futureReaders chan chan io.Reader

	// Only used for passing into the MemoryRateLimiter to ensure we
	// release as much memory as we requested.
	allocatedSize int64
}
206
// ZipArgs collects the options accepted by Zip and ZipTo.
type ZipArgs struct {
	// FileArgs lists the inputs to add to the zip file.
	FileArgs []FileArg
	// OutputFilePath is the file Zip writes; it must be non-empty for Zip.
	OutputFilePath string
	// EmulateJar adds a manifest entry, sorts entries in jar order and forces
	// AddDirectoryEntriesToZip on.
	EmulateJar bool
	// AddDirectoryEntriesToZip writes explicit entries for directories.
	AddDirectoryEntriesToZip bool
	// CompressionLevel is the flate level; 0 stores every file uncompressed.
	CompressionLevel int
	// ManifestSourcePath is the manifest source file; it may only be set
	// together with EmulateJar.
	ManifestSourcePath string
	// NumParallelJobs is passed to the CPU rate limiter.
	NumParallelJobs int
	// NonDeflatedFiles holds zip paths that are stored rather than deflated;
	// presence of the key is what matters.
	NonDeflatedFiles map[string]bool
	// WriteIfChanged builds the zip in memory and only rewrites
	// OutputFilePath through pathtools.WriteFileIfChanged.
	WriteIfChanged bool
	// StoreSymlinks stores symlinks as symlinks instead of following them.
	StoreSymlinks bool

	// Filesystem is the filesystem to read from; nil means pathtools.OsFs.
	Filesystem pathtools.FileSystem
}
Colin Cross2fe66872015-03-30 17:20:39 -0700221
// NOQUOTE is the sentinel rune meaning "not inside a quoted section" while
// parsing a response file.
const NOQUOTE = '\x00'

// ReadRespFile splits the contents of a response file into arguments.
//
// Arguments are separated by unquoted whitespace. Single and double quotes
// group text (the quote characters themselves are dropped). Outside of quotes
// a backslash makes the next character literal; inside double quotes only
// \" and \\ are treated as escapes and any other backslash is preserved;
// inside single quotes backslashes are ordinary characters. Empty arguments
// are never emitted, and nil is returned when there are no arguments.
func ReadRespFile(bytes []byte) []string {
	var (
		args    []string
		current strings.Builder
		escaped bool
		quote   rune = NOQUOTE
	)

	// flush emits the argument collected so far, if any, and starts a new one.
	flush := func() {
		if current.Len() != 0 {
			args = append(args, current.String())
		}
		current.Reset()
	}

	for _, c := range string(bytes) {
		if escaped {
			// The previous character was a backslash. Within double quotes
			// it only escapes '"' and '\\'; otherwise keep it literally.
			if quote == '"' && c != '"' && c != '\\' {
				current.WriteRune('\\')
			}
			current.WriteRune(c)
			escaped = false
			continue
		}

		if c == '\\' && quote != '\'' {
			escaped = true
			continue
		}

		if quote == NOQUOTE {
			if c == '\'' || c == '"' {
				quote = c
				continue
			}
			if unicode.IsSpace(c) {
				flush()
				continue
			}
		} else if c == quote {
			quote = NOQUOTE
			continue
		}

		current.WriteRune(c)
	}

	flush()
	return args
}
264
Colin Cross05518bc2018-09-27 15:06:19 -0700265func ZipTo(args ZipArgs, w io.Writer) error {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700266 if args.EmulateJar {
267 args.AddDirectoryEntriesToZip = true
Jeff Gaston8edbb3a2017-08-22 20:05:28 -0700268 }
269
Colin Cross09f11052018-09-21 15:12:39 -0700270 // Have Glob follow symlinks if they are not being stored as symlinks in the zip file.
271 followSymlinks := pathtools.ShouldFollowSymlinks(!args.StoreSymlinks)
272
Colin Cross05518bc2018-09-27 15:06:19 -0700273 z := &ZipWriter{
Colin Cross09f11052018-09-21 15:12:39 -0700274 time: jar.DefaultTime,
275 createdDirs: make(map[string]string),
276 createdFiles: make(map[string]string),
277 directories: args.AddDirectoryEntriesToZip,
278 compLevel: args.CompressionLevel,
279 followSymlinks: followSymlinks,
280 fs: args.Filesystem,
Colin Cross2fe66872015-03-30 17:20:39 -0700281 }
Colin Cross05518bc2018-09-27 15:06:19 -0700282
283 if z.fs == nil {
284 z.fs = pathtools.OsFs
285 }
286
Nan Zhang9067b042017-03-17 14:04:43 -0700287 pathMappings := []pathMapping{}
Nan Zhang9067b042017-03-17 14:04:43 -0700288
Colin Crossd3216292018-09-14 15:06:31 -0700289 noCompression := args.CompressionLevel == 0
290
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700291 for _, fa := range args.FileArgs {
Colin Cross1d98ee22018-09-18 17:05:15 -0700292 var srcs []string
293 for _, s := range fa.SourceFiles {
294 s = strings.TrimSpace(s)
295 if s == "" {
296 continue
297 }
298
Colin Cross09f11052018-09-21 15:12:39 -0700299 globbed, _, err := z.fs.Glob(s, nil, followSymlinks)
Colin Cross1d98ee22018-09-18 17:05:15 -0700300 if err != nil {
301 return err
302 }
303 if len(globbed) == 0 {
304 return &os.PathError{
305 Op: "stat",
306 Path: s,
307 Err: os.ErrNotExist,
308 }
309 }
310 srcs = append(srcs, globbed...)
311 }
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700312 if fa.GlobDir != "" {
Colin Cross1d98ee22018-09-18 17:05:15 -0700313 if exists, isDir, err := z.fs.Exists(fa.GlobDir); err != nil {
314 return err
315 } else if !exists {
316 return &os.PathError{
317 Op: "stat",
318 Path: fa.GlobDir,
319 Err: os.ErrNotExist,
320 }
321 } else if !isDir {
322 return &os.PathError{
323 Op: "stat",
324 Path: fa.GlobDir,
325 Err: syscall.ENOTDIR,
326 }
327 }
Colin Cross09f11052018-09-21 15:12:39 -0700328 globbed, _, err := z.fs.Glob(filepath.Join(fa.GlobDir, "**/*"), nil, followSymlinks)
Colin Cross1d98ee22018-09-18 17:05:15 -0700329 if err != nil {
330 return err
331 }
332 srcs = append(srcs, globbed...)
Colin Cross7b10cf12017-08-30 14:12:21 -0700333 }
334 for _, src := range srcs {
Colin Crossb7c69112018-09-18 16:51:43 -0700335 err := fillPathPairs(fa, src, &pathMappings, args.NonDeflatedFiles, noCompression)
Colin Crossd3216292018-09-14 15:06:31 -0700336 if err != nil {
Colin Cross05518bc2018-09-27 15:06:19 -0700337 return err
Nan Zhang9067b042017-03-17 14:04:43 -0700338 }
339 }
340 }
341
Colin Cross05518bc2018-09-27 15:06:19 -0700342 return z.write(w, pathMappings, args.ManifestSourcePath, args.EmulateJar, args.NumParallelJobs)
343}
344
345func Zip(args ZipArgs) error {
346 if args.OutputFilePath == "" {
347 return fmt.Errorf("output file path must be nonempty")
348 }
349
Colin Crossf83c1502017-11-10 13:11:02 -0800350 buf := &bytes.Buffer{}
351 var out io.Writer = buf
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700352
Colin Crossf83c1502017-11-10 13:11:02 -0800353 if !args.WriteIfChanged {
354 f, err := os.Create(args.OutputFilePath)
355 if err != nil {
356 return err
357 }
358
359 defer f.Close()
360 defer func() {
361 if err != nil {
362 os.Remove(args.OutputFilePath)
363 }
364 }()
365
366 out = f
367 }
368
Colin Cross05518bc2018-09-27 15:06:19 -0700369 err := ZipTo(args, out)
Colin Crossf83c1502017-11-10 13:11:02 -0800370 if err != nil {
371 return err
372 }
373
374 if args.WriteIfChanged {
375 err := pathtools.WriteFileIfChanged(args.OutputFilePath, buf.Bytes(), 0666)
376 if err != nil {
377 return err
378 }
379 }
380
381 return nil
Colin Cross2fe66872015-03-30 17:20:39 -0700382}
383
Colin Crossb7c69112018-09-18 16:51:43 -0700384func fillPathPairs(fa FileArg, src string, pathMappings *[]pathMapping,
Colin Crossd3216292018-09-14 15:06:31 -0700385 nonDeflatedFiles map[string]bool, noCompression bool) error {
386
Colin Crossb7c69112018-09-18 16:51:43 -0700387 var dest string
388
389 if fa.JunkPaths {
390 dest = filepath.Base(src)
391 } else {
392 var err error
393 dest, err = filepath.Rel(fa.SourcePrefixToStrip, src)
394 if err != nil {
395 return err
396 }
Colin Cross1d98ee22018-09-18 17:05:15 -0700397 if strings.HasPrefix(dest, "../") {
398 return IncorrectRelativeRootError{
399 Path: src,
400 RelativeRoot: fa.SourcePrefixToStrip,
401 }
402 }
403
Nan Zhang9067b042017-03-17 14:04:43 -0700404 }
Colin Crossb7c69112018-09-18 16:51:43 -0700405 dest = filepath.Join(fa.PathPrefixInZip, dest)
Nan Zhang9067b042017-03-17 14:04:43 -0700406
Nan Zhangf281bd82017-04-25 16:47:45 -0700407 zipMethod := zip.Deflate
Colin Crossd3216292018-09-14 15:06:31 -0700408 if _, found := nonDeflatedFiles[dest]; found || noCompression {
Nan Zhangf281bd82017-04-25 16:47:45 -0700409 zipMethod = zip.Store
410 }
411 *pathMappings = append(*pathMappings,
412 pathMapping{dest: dest, src: src, zipMethod: zipMethod})
Nan Zhang9067b042017-03-17 14:04:43 -0700413
414 return nil
415}
416
Jeff Gastona2976952017-08-22 17:51:25 -0700417func jarSort(mappings []pathMapping) {
418 less := func(i int, j int) (smaller bool) {
419 return jar.EntryNamesLess(mappings[i].dest, mappings[j].dest)
420 }
421 sort.SliceStable(mappings, less)
422}
423
Colin Crossf83c1502017-11-10 13:11:02 -0800424func (z *ZipWriter) write(f io.Writer, pathMappings []pathMapping, manifest string, emulateJar bool, parallelJobs int) error {
Dan Willemsen017d8932016-08-04 15:43:03 -0700425 z.errors = make(chan error)
426 defer close(z.errors)
Colin Cross2fe66872015-03-30 17:20:39 -0700427
Dan Willemsen017d8932016-08-04 15:43:03 -0700428 // This channel size can be essentially unlimited -- it's used as a fifo
429 // queue decouple the CPU and IO loads. Directories don't require any
430 // compression time, but still cost some IO. Similar with small files that
431 // can be very fast to compress. Some files that are more difficult to
432 // compress won't take a corresponding longer time writing out.
433 //
434 // The optimum size here depends on your CPU and IO characteristics, and
435 // the the layout of your zip file. 1000 was chosen mostly at random as
436 // something that worked reasonably well for a test file.
437 //
438 // The RateLimit object will put the upper bounds on the number of
439 // parallel compressions and outstanding buffers.
440 z.writeOps = make(chan chan *zipEntry, 1000)
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700441 z.cpuRateLimiter = NewCPURateLimiter(int64(parallelJobs))
Jeff Gaston175f34c2017-08-17 21:43:21 -0700442 z.memoryRateLimiter = NewMemoryRateLimiter(0)
443 defer func() {
444 z.cpuRateLimiter.Stop()
445 z.memoryRateLimiter.Stop()
446 }()
Jeff Gastona2976952017-08-22 17:51:25 -0700447
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700448 if manifest != "" && !emulateJar {
Colin Cross635acc92017-09-12 22:50:46 -0700449 return errors.New("must specify --jar when specifying a manifest via -m")
Jeff Gastona2976952017-08-22 17:51:25 -0700450 }
451
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700452 if emulateJar {
Colin Cross635acc92017-09-12 22:50:46 -0700453 // manifest may be empty, in which case addManifest will fill in a default
454 pathMappings = append(pathMappings, pathMapping{jar.ManifestFile, manifest, zip.Deflate})
455
Jeff Gastona2976952017-08-22 17:51:25 -0700456 jarSort(pathMappings)
457 }
458
Dan Willemsen017d8932016-08-04 15:43:03 -0700459 go func() {
460 var err error
461 defer close(z.writeOps)
462
Nan Zhang9067b042017-03-17 14:04:43 -0700463 for _, ele := range pathMappings {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700464 if emulateJar && ele.dest == jar.ManifestFile {
Jeff Gastoncef50b92017-08-23 15:41:35 -0700465 err = z.addManifest(ele.dest, ele.src, ele.zipMethod)
466 } else {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700467 err = z.addFile(ele.dest, ele.src, ele.zipMethod, emulateJar)
Jeff Gastoncef50b92017-08-23 15:41:35 -0700468 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700469 if err != nil {
470 z.errors <- err
471 return
472 }
473 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700474 }()
475
476 zipw := zip.NewWriter(f)
477
478 var currentWriteOpChan chan *zipEntry
479 var currentWriter io.WriteCloser
480 var currentReaders chan chan io.Reader
481 var currentReader chan io.Reader
482 var done bool
483
484 for !done {
485 var writeOpsChan chan chan *zipEntry
486 var writeOpChan chan *zipEntry
487 var readersChan chan chan io.Reader
488
489 if currentReader != nil {
490 // Only read and process errors
491 } else if currentReaders != nil {
492 readersChan = currentReaders
493 } else if currentWriteOpChan != nil {
494 writeOpChan = currentWriteOpChan
495 } else {
496 writeOpsChan = z.writeOps
497 }
498
499 select {
500 case writeOp, ok := <-writeOpsChan:
501 if !ok {
502 done = true
503 }
504
505 currentWriteOpChan = writeOp
506
507 case op := <-writeOpChan:
508 currentWriteOpChan = nil
509
Colin Crossf83c1502017-11-10 13:11:02 -0800510 var err error
Dan Willemsen017d8932016-08-04 15:43:03 -0700511 if op.fh.Method == zip.Deflate {
512 currentWriter, err = zipw.CreateCompressedHeader(op.fh)
513 } else {
514 var zw io.Writer
Jeff Gastonc5eb66d2017-08-24 14:11:27 -0700515
516 op.fh.CompressedSize64 = op.fh.UncompressedSize64
517
518 zw, err = zipw.CreateHeaderAndroid(op.fh)
Dan Willemsen017d8932016-08-04 15:43:03 -0700519 currentWriter = nopCloser{zw}
520 }
521 if err != nil {
522 return err
523 }
524
525 currentReaders = op.futureReaders
526 if op.futureReaders == nil {
527 currentWriter.Close()
528 currentWriter = nil
529 }
Jeff Gaston175f34c2017-08-17 21:43:21 -0700530 z.memoryRateLimiter.Finish(op.allocatedSize)
Dan Willemsen017d8932016-08-04 15:43:03 -0700531
532 case futureReader, ok := <-readersChan:
533 if !ok {
534 // Done with reading
535 currentWriter.Close()
536 currentWriter = nil
537 currentReaders = nil
538 }
539
540 currentReader = futureReader
541
542 case reader := <-currentReader:
Colin Crossf83c1502017-11-10 13:11:02 -0800543 _, err := io.Copy(currentWriter, reader)
Dan Willemsen017d8932016-08-04 15:43:03 -0700544 if err != nil {
545 return err
546 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700547
548 currentReader = nil
549
Colin Crossf83c1502017-11-10 13:11:02 -0800550 case err := <-z.errors:
Colin Cross2fe66872015-03-30 17:20:39 -0700551 return err
552 }
553 }
554
Dan Willemsen017d8932016-08-04 15:43:03 -0700555 // One last chance to catch an error
556 select {
Colin Crossf83c1502017-11-10 13:11:02 -0800557 case err := <-z.errors:
Dan Willemsen017d8932016-08-04 15:43:03 -0700558 return err
559 default:
560 zipw.Close()
561 return nil
Colin Cross2fe66872015-03-30 17:20:39 -0700562 }
Colin Cross2fe66872015-03-30 17:20:39 -0700563}
564
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700565// imports (possibly with compression) <src> into the zip at sub-path <dest>
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700566func (z *ZipWriter) addFile(dest, src string, method uint16, emulateJar bool) error {
Dan Willemsen017d8932016-08-04 15:43:03 -0700567 var fileSize int64
Dan Willemsen10462b32017-03-15 19:02:51 -0700568 var executable bool
Dan Willemsen017d8932016-08-04 15:43:03 -0700569
Colin Cross09f11052018-09-21 15:12:39 -0700570 var s os.FileInfo
571 var err error
572 if z.followSymlinks {
573 s, err = z.fs.Stat(src)
574 } else {
575 s, err = z.fs.Lstat(src)
576 }
577
578 if err != nil {
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700579 return err
580 } else if s.IsDir() {
Colin Cross957cc4e2015-04-24 15:10:32 -0700581 if z.directories {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700582 return z.writeDirectory(dest, src, emulateJar)
Colin Cross957cc4e2015-04-24 15:10:32 -0700583 }
584 return nil
Dan Willemsen017d8932016-08-04 15:43:03 -0700585 } else {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700586 if err := z.writeDirectory(filepath.Dir(dest), src, emulateJar); err != nil {
Colin Crosse5580972017-08-30 17:40:21 -0700587 return err
588 }
589
590 if prev, exists := z.createdDirs[dest]; exists {
591 return fmt.Errorf("destination %q is both a directory %q and a file %q", dest, prev, src)
592 }
593 if prev, exists := z.createdFiles[dest]; exists {
594 return fmt.Errorf("destination %q has two files %q and %q", dest, prev, src)
595 }
596
597 z.createdFiles[dest] = src
598
599 if s.Mode()&os.ModeSymlink != 0 {
600 return z.writeSymlink(dest, src)
601 } else if !s.Mode().IsRegular() {
602 return fmt.Errorf("%s is not a file, directory, or symlink", src)
603 }
604
Dan Willemsen017d8932016-08-04 15:43:03 -0700605 fileSize = s.Size()
Dan Willemsen10462b32017-03-15 19:02:51 -0700606 executable = s.Mode()&0100 != 0
Colin Cross957cc4e2015-04-24 15:10:32 -0700607 }
608
Colin Cross05518bc2018-09-27 15:06:19 -0700609 r, err := z.fs.Open(src)
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700610 if err != nil {
611 return err
612 }
613
614 header := &zip.FileHeader{
615 Name: dest,
616 Method: method,
617 UncompressedSize64: uint64(fileSize),
618 }
619
620 if executable {
621 header.SetMode(0700)
622 }
623
624 return z.writeFileContents(header, r)
625}
626
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700627func (z *ZipWriter) addManifest(dest string, src string, method uint16) error {
Colin Crosse5580972017-08-30 17:40:21 -0700628 if prev, exists := z.createdDirs[dest]; exists {
629 return fmt.Errorf("destination %q is both a directory %q and a file %q", dest, prev, src)
630 }
631 if prev, exists := z.createdFiles[dest]; exists {
632 return fmt.Errorf("destination %q has two files %q and %q", dest, prev, src)
633 }
634
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700635 if err := z.writeDirectory(filepath.Dir(dest), src, true); err != nil {
Colin Cross635acc92017-09-12 22:50:46 -0700636 return err
Jeff Gastoncef50b92017-08-23 15:41:35 -0700637 }
638
Colin Cross05518bc2018-09-27 15:06:19 -0700639 var contents []byte
640 if src != "" {
641 f, err := z.fs.Open(src)
642 if err != nil {
643 return err
644 }
645
646 contents, err = ioutil.ReadAll(f)
647 f.Close()
648 if err != nil {
649 return err
650 }
651 }
652
653 fh, buf, err := jar.ManifestFileContents(contents)
Colin Cross635acc92017-09-12 22:50:46 -0700654 if err != nil {
655 return err
Jeff Gastoncef50b92017-08-23 15:41:35 -0700656 }
657
Colin Cross635acc92017-09-12 22:50:46 -0700658 reader := &byteReaderCloser{bytes.NewReader(buf), ioutil.NopCloser(nil)}
659
660 return z.writeFileContents(fh, reader)
Jeff Gastoncef50b92017-08-23 15:41:35 -0700661}
662
// writeFileContents queues one file entry described by header whose contents
// are read from r, and starts the goroutines that compute its CRC and
// (optionally compressed) data. It returns once the work has been scheduled;
// failures inside the goroutines are reported on z.errors. r is closed by the
// spawned goroutines when they are done with it.
//
// Deflated files of at least minParallelFileSize bytes are split into
// parallelBlockSize chunks that are compressed concurrently; everything else
// is handled in one piece by compressWholeFile.
func (z *ZipWriter) writeFileContents(header *zip.FileHeader, r pathtools.ReaderAtSeekerCloser) (err error) {

	header.SetModTime(z.time)

	// Reserve this entry's slot in the output order before any work starts;
	// the finished zipEntry is delivered on compressChan later.
	compressChan := make(chan *zipEntry, 1)
	z.writeOps <- compressChan

	// Pre-fill a zipEntry, it will be sent in the compressChan once
	// we're sure about the Method and CRC.
	ze := &zipEntry{
		fh: header,
	}

	// The CPU request made here is finished by crcFile (parallel path) or by
	// compressWholeFile. The memory request is finished by the write loop
	// once the entry's header has been written.
	ze.allocatedSize = int64(header.UncompressedSize64)
	z.cpuRateLimiter.Request()
	z.memoryRateLimiter.Request(ze.allocatedSize)

	// Fall back to the 32-bit size field when the 64-bit one is unset.
	fileSize := int64(header.UncompressedSize64)
	if fileSize == 0 {
		fileSize = int64(header.UncompressedSize)
	}

	if header.Method == zip.Deflate && fileSize >= minParallelFileSize {
		wg := new(sync.WaitGroup)

		// Allocate enough buffer to hold all readers. We'll limit
		// this based on actual buffer sizes in RateLimit.
		ze.futureReaders = make(chan chan io.Reader, (fileSize/parallelBlockSize)+1)

		// Calculate the CRC in the background, since reading the entire
		// file could take a while.
		//
		// We could split this up into chunks as well, but it's faster
		// than the compression. Due to the Go Zip API, we also need to
		// know the result before we can begin writing the compressed
		// data out to the zipfile.
		wg.Add(1)
		go z.crcFile(r, ze, compressChan, wg)

		for start := int64(0); start < fileSize; start += parallelBlockSize {
			sr := io.NewSectionReader(r, start, parallelBlockSize)
			// Queue the result slot first so chunks are written in file order
			// no matter which compression finishes first.
			resultChan := make(chan io.Reader, 1)
			ze.futureReaders <- resultChan

			// One CPU token per chunk; compressPartialFile finishes it.
			z.cpuRateLimiter.Request()

			// Only the final chunk terminates the deflate stream.
			last := !(start+parallelBlockSize < fileSize)
			var dict []byte
			if start >= windowSize {
				// Prime the compressor with the windowSize bytes that precede
				// this chunk.
				dict, err = ioutil.ReadAll(io.NewSectionReader(r, start-windowSize, windowSize))
				if err != nil {
					// NOTE(review): on this path r is never closed, the CPU
					// token requested above is not finished, and
					// ze.futureReaders is left open — confirm that aborting
					// the whole write makes this acceptable.
					return err
				}
			}

			wg.Add(1)
			go z.compressPartialFile(sr, dict, last, resultChan, wg)
		}

		close(ze.futureReaders)

		// Close the file handle after all readers are done
		go func(wg *sync.WaitGroup, closer io.Closer) {
			wg.Wait()
			closer.Close()
		}(wg, r)
	} else {
		go func() {
			z.compressWholeFile(ze, r, compressChan)
			r.Close()
		}()
	}

	return nil
}
738
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700739func (z *ZipWriter) crcFile(r io.Reader, ze *zipEntry, resultChan chan *zipEntry, wg *sync.WaitGroup) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700740 defer wg.Done()
Jeff Gaston175f34c2017-08-17 21:43:21 -0700741 defer z.cpuRateLimiter.Finish()
Dan Willemsen017d8932016-08-04 15:43:03 -0700742
743 crc := crc32.NewIEEE()
744 _, err := io.Copy(crc, r)
745 if err != nil {
746 z.errors <- err
747 return
748 }
749
750 ze.fh.CRC32 = crc.Sum32()
751 resultChan <- ze
752 close(resultChan)
753}
754
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700755func (z *ZipWriter) compressPartialFile(r io.Reader, dict []byte, last bool, resultChan chan io.Reader, wg *sync.WaitGroup) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700756 defer wg.Done()
757
758 result, err := z.compressBlock(r, dict, last)
759 if err != nil {
760 z.errors <- err
761 return
762 }
763
Jeff Gaston175f34c2017-08-17 21:43:21 -0700764 z.cpuRateLimiter.Finish()
765
Dan Willemsen017d8932016-08-04 15:43:03 -0700766 resultChan <- result
767}
768
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700769func (z *ZipWriter) compressBlock(r io.Reader, dict []byte, last bool) (*bytes.Buffer, error) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700770 buf := new(bytes.Buffer)
771 var fw *flate.Writer
772 var err error
773 if len(dict) > 0 {
774 // There's no way to Reset a Writer with a new dictionary, so
775 // don't use the Pool
776 fw, err = flate.NewWriterDict(buf, z.compLevel, dict)
777 } else {
778 var ok bool
779 if fw, ok = z.compressorPool.Get().(*flate.Writer); ok {
780 fw.Reset(buf)
781 } else {
782 fw, err = flate.NewWriter(buf, z.compLevel)
783 }
784 defer z.compressorPool.Put(fw)
785 }
786 if err != nil {
787 return nil, err
788 }
789
790 _, err = io.Copy(fw, r)
791 if err != nil {
792 return nil, err
793 }
794 if last {
795 fw.Close()
796 } else {
797 fw.Flush()
798 }
799
800 return buf, nil
801}
802
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700803func (z *ZipWriter) compressWholeFile(ze *zipEntry, r io.ReadSeeker, compressChan chan *zipEntry) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700804
Dan Willemsen017d8932016-08-04 15:43:03 -0700805 crc := crc32.NewIEEE()
Dan Willemsena8b55022017-03-15 21:49:26 -0700806 _, err := io.Copy(crc, r)
Colin Cross2fe66872015-03-30 17:20:39 -0700807 if err != nil {
Dan Willemsen017d8932016-08-04 15:43:03 -0700808 z.errors <- err
809 return
Colin Cross2fe66872015-03-30 17:20:39 -0700810 }
811
Dan Willemsena8b55022017-03-15 21:49:26 -0700812 ze.fh.CRC32 = crc.Sum32()
Colin Cross2fe66872015-03-30 17:20:39 -0700813
Dan Willemsen017d8932016-08-04 15:43:03 -0700814 _, err = r.Seek(0, 0)
Colin Cross2fe66872015-03-30 17:20:39 -0700815 if err != nil {
Dan Willemsen017d8932016-08-04 15:43:03 -0700816 z.errors <- err
817 return
Colin Cross2fe66872015-03-30 17:20:39 -0700818 }
819
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700820 readFile := func(reader io.ReadSeeker) ([]byte, error) {
821 _, err := reader.Seek(0, 0)
Nan Zhangf281bd82017-04-25 16:47:45 -0700822 if err != nil {
823 return nil, err
824 }
825
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700826 buf, err := ioutil.ReadAll(reader)
Nan Zhangf281bd82017-04-25 16:47:45 -0700827 if err != nil {
828 return nil, err
829 }
830
831 return buf, nil
832 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700833
Dan Willemsena8b55022017-03-15 21:49:26 -0700834 ze.futureReaders = make(chan chan io.Reader, 1)
Dan Willemsen017d8932016-08-04 15:43:03 -0700835 futureReader := make(chan io.Reader, 1)
836 ze.futureReaders <- futureReader
837 close(ze.futureReaders)
838
Nan Zhangf281bd82017-04-25 16:47:45 -0700839 if ze.fh.Method == zip.Deflate {
840 compressed, err := z.compressBlock(r, nil, true)
841 if err != nil {
842 z.errors <- err
843 return
844 }
845 if uint64(compressed.Len()) < ze.fh.UncompressedSize64 {
846 futureReader <- compressed
Nan Zhangf281bd82017-04-25 16:47:45 -0700847 } else {
848 buf, err := readFile(r)
849 if err != nil {
850 z.errors <- err
851 return
852 }
853 ze.fh.Method = zip.Store
854 futureReader <- bytes.NewReader(buf)
Nan Zhangf281bd82017-04-25 16:47:45 -0700855 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700856 } else {
Nan Zhangf281bd82017-04-25 16:47:45 -0700857 buf, err := readFile(r)
Dan Willemsen017d8932016-08-04 15:43:03 -0700858 if err != nil {
859 z.errors <- err
860 return
861 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700862 ze.fh.Method = zip.Store
863 futureReader <- bytes.NewReader(buf)
Dan Willemsen017d8932016-08-04 15:43:03 -0700864 }
Nan Zhangf281bd82017-04-25 16:47:45 -0700865
Jeff Gaston175f34c2017-08-17 21:43:21 -0700866 z.cpuRateLimiter.Finish()
867
Dan Willemsen017d8932016-08-04 15:43:03 -0700868 close(futureReader)
869
870 compressChan <- ze
871 close(compressChan)
Colin Cross2fe66872015-03-30 17:20:39 -0700872}
Colin Crosse19c7932015-04-24 15:08:38 -0700873
Colin Crosse5580972017-08-30 17:40:21 -0700874// writeDirectory annotates that dir is a directory created for the src file or directory, and adds
875// the directory entry to the zip file if directories are enabled.
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700876func (z *ZipWriter) writeDirectory(dir string, src string, emulateJar bool) error {
Jeff Gaston2d174132017-08-15 18:05:56 -0700877 // clean the input
Colin Crosse5580972017-08-30 17:40:21 -0700878 dir = filepath.Clean(dir)
Jeff Gaston2d174132017-08-15 18:05:56 -0700879
880 // discover any uncreated directories in the path
881 zipDirs := []string{}
Colin Crosse5580972017-08-30 17:40:21 -0700882 for dir != "" && dir != "." {
883 if _, exists := z.createdDirs[dir]; exists {
884 break
885 }
Jeff Gaston2d174132017-08-15 18:05:56 -0700886
Colin Crosse5580972017-08-30 17:40:21 -0700887 if prev, exists := z.createdFiles[dir]; exists {
888 return fmt.Errorf("destination %q is both a directory %q and a file %q", dir, src, prev)
889 }
890
891 z.createdDirs[dir] = src
Jeff Gaston2d174132017-08-15 18:05:56 -0700892 // parent directories precede their children
Colin Crosse5580972017-08-30 17:40:21 -0700893 zipDirs = append([]string{dir}, zipDirs...)
Jeff Gaston2d174132017-08-15 18:05:56 -0700894
Colin Crosse5580972017-08-30 17:40:21 -0700895 dir = filepath.Dir(dir)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700896 }
897
Colin Crosse5580972017-08-30 17:40:21 -0700898 if z.directories {
899 // make a directory entry for each uncreated directory
900 for _, cleanDir := range zipDirs {
Colin Cross635acc92017-09-12 22:50:46 -0700901 var dirHeader *zip.FileHeader
Colin Crosse19c7932015-04-24 15:08:38 -0700902
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700903 if emulateJar && cleanDir+"/" == jar.MetaDir {
Colin Cross635acc92017-09-12 22:50:46 -0700904 dirHeader = jar.MetaDirFileHeader()
905 } else {
906 dirHeader = &zip.FileHeader{
907 Name: cleanDir + "/",
908 }
909 dirHeader.SetMode(0700 | os.ModeDir)
Colin Crosse5580972017-08-30 17:40:21 -0700910 }
Jeff Gaston8edbb3a2017-08-22 20:05:28 -0700911
Colin Cross635acc92017-09-12 22:50:46 -0700912 dirHeader.SetModTime(z.time)
913
Colin Crosse5580972017-08-30 17:40:21 -0700914 ze := make(chan *zipEntry, 1)
915 ze <- &zipEntry{
916 fh: dirHeader,
917 }
918 close(ze)
919 z.writeOps <- ze
Colin Crosse19c7932015-04-24 15:08:38 -0700920 }
Colin Crosse19c7932015-04-24 15:08:38 -0700921 }
922
923 return nil
924}
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700925
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700926func (z *ZipWriter) writeSymlink(rel, file string) error {
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700927 fileHeader := &zip.FileHeader{
928 Name: rel,
929 }
930 fileHeader.SetModTime(z.time)
Colin Cross297d9bc2018-06-22 16:37:47 -0700931 fileHeader.SetMode(0777 | os.ModeSymlink)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700932
Colin Cross05518bc2018-09-27 15:06:19 -0700933 dest, err := z.fs.Readlink(file)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700934 if err != nil {
935 return err
936 }
937
Colin Cross297d9bc2018-06-22 16:37:47 -0700938 fileHeader.UncompressedSize64 = uint64(len(dest))
939 fileHeader.CRC32 = crc32.ChecksumIEEE([]byte(dest))
940
Dan Willemsen017d8932016-08-04 15:43:03 -0700941 ze := make(chan *zipEntry, 1)
942 futureReaders := make(chan chan io.Reader, 1)
943 futureReader := make(chan io.Reader, 1)
944 futureReaders <- futureReader
945 close(futureReaders)
946 futureReader <- bytes.NewBufferString(dest)
947 close(futureReader)
948
Dan Willemsen017d8932016-08-04 15:43:03 -0700949 ze <- &zipEntry{
950 fh: fileHeader,
951 futureReaders: futureReaders,
952 }
953 close(ze)
954 z.writeOps <- ze
955
956 return nil
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700957}