blob: 96f4535ae5418385df939e9cf9798ca36d1f1c41 [file] [log] [blame]
Colin Cross2fe66872015-03-30 17:20:39 -07001// Copyright 2015 Google Inc. All rights reserved.
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7// http://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
Jeff Gaston11b5c512017-10-12 12:19:14 -070015package zip
Colin Cross2fe66872015-03-30 17:20:39 -070016
17import (
Dan Willemsen017d8932016-08-04 15:43:03 -070018 "bytes"
19 "compress/flate"
Jeff Gastona2976952017-08-22 17:51:25 -070020 "errors"
Colin Cross2fe66872015-03-30 17:20:39 -070021 "fmt"
Dan Willemsen017d8932016-08-04 15:43:03 -070022 "hash/crc32"
Colin Cross2fe66872015-03-30 17:20:39 -070023 "io"
24 "io/ioutil"
Nan Zhang9067b042017-03-17 14:04:43 -070025 "log"
Colin Cross2fe66872015-03-30 17:20:39 -070026 "os"
27 "path/filepath"
Jeff Gastona2976952017-08-22 17:51:25 -070028 "sort"
Colin Cross2fe66872015-03-30 17:20:39 -070029 "strings"
Dan Willemsen017d8932016-08-04 15:43:03 -070030 "sync"
Colin Cross2fe66872015-03-30 17:20:39 -070031 "time"
Nan Zhang674dd932018-01-26 18:30:36 -080032 "unicode"
Dan Willemsen017d8932016-08-04 15:43:03 -070033
Colin Crossf83c1502017-11-10 13:11:02 -080034 "github.com/google/blueprint/pathtools"
35
Jeff Gastona2976952017-08-22 17:51:25 -070036 "android/soong/jar"
Dan Willemsen017d8932016-08-04 15:43:03 -070037 "android/soong/third_party/zip"
Colin Cross2fe66872015-03-30 17:20:39 -070038)
39
const (
	// parallelBlockSize is the size of each block when a single file is
	// compressed in parallel (1MB).
	parallelBlockSize = 1 << 20

	// minParallelFileSize is the smallest file size for which parallel
	// compression is used. Parallel compression requires more flate.Writer
	// allocations, since the dictionary can't be changed during Reset.
	minParallelFileSize = 6 * parallelBlockSize

	// windowSize is the size of the ZIP compression window (32KB).
	windowSize = 32 << 10
)
50
// nopCloser adapts an io.Writer into an io.WriteCloser whose Close method
// does nothing.
type nopCloser struct{ io.Writer }

// Close is a no-op and always reports success.
func (nopCloser) Close() error { return nil }
58
// byteReaderCloser pairs an in-memory *bytes.Reader with an io.Closer so that
// a byte slice can be used where a reader that must also be closed is
// expected.
type byteReaderCloser struct {
	*bytes.Reader
	io.Closer
}
63
// pathMapping describes one entry to add to the zip. The field order is
// significant: the type is also constructed with positional literals.
type pathMapping struct {
	// dest is the entry's path inside the zip.
	dest string
	// src is the path of the source file on disk.
	src string
	// zipMethod is the zip method (e.g. zip.Deflate or zip.Store) for the entry.
	zipMethod uint16
}
68
// FileArg describes a group of source files and how their paths are mapped
// to paths inside the zip.
type FileArg struct {
	// PathPrefixInZip is joined in front of every destination path.
	PathPrefixInZip string
	// SourcePrefixToStrip is the base directory that source paths are made
	// relative to (unless JunkPaths is set).
	SourcePrefixToStrip string
	// SourceFiles lists the source paths to add.
	SourceFiles []string
	// JunkPaths, when set, keeps only the base name of each source path.
	JunkPaths bool
	// GlobDir, when non-empty, is walked recursively and every non-directory
	// found is added to the sources.
	GlobDir string
}
75
// FileArgsBuilder incrementally builds a list of FileArg values. The option
// setters (JunkPaths, SourcePrefixToStrip, PathPrefixInZip) update state, and
// File, Dir and List each append a copy of the current state to fileArgs.
type FileArgsBuilder struct {
	// state holds the options that are copied into each appended FileArg.
	state FileArg
	// err is the first error recorded; once set, File, Dir and List do nothing.
	err error
	// fs is the filesystem used by List to open list files.
	fs pathtools.FileSystem

	// fileArgs is the accumulated result returned by FileArgs.
	fileArgs []FileArg
}
83
84func NewFileArgsBuilder() *FileArgsBuilder {
85 return &FileArgsBuilder{
86 fs: pathtools.OsFs,
87 }
88}
89
90func (b *FileArgsBuilder) JunkPaths(v bool) *FileArgsBuilder {
91 b.state.JunkPaths = v
92 b.state.SourcePrefixToStrip = ""
93 return b
94}
95
96func (b *FileArgsBuilder) SourcePrefixToStrip(prefixToStrip string) *FileArgsBuilder {
97 b.state.JunkPaths = false
98 b.state.SourcePrefixToStrip = prefixToStrip
99 return b
100}
101
102func (b *FileArgsBuilder) PathPrefixInZip(rootPrefix string) *FileArgsBuilder {
103 b.state.PathPrefixInZip = rootPrefix
104 return b
105}
106
107func (b *FileArgsBuilder) File(name string) *FileArgsBuilder {
108 if b.err != nil {
109 return b
110 }
111
112 arg := b.state
113 arg.SourceFiles = []string{name}
114 b.fileArgs = append(b.fileArgs, arg)
115 return b
116}
117
118func (b *FileArgsBuilder) Dir(name string) *FileArgsBuilder {
119 if b.err != nil {
120 return b
121 }
122
123 arg := b.state
124 arg.GlobDir = name
125 b.fileArgs = append(b.fileArgs, arg)
126 return b
127}
128
129func (b *FileArgsBuilder) List(name string) *FileArgsBuilder {
130 if b.err != nil {
131 return b
132 }
133
134 f, err := b.fs.Open(name)
135 if err != nil {
136 b.err = err
137 return b
138 }
139 defer f.Close()
140
141 list, err := ioutil.ReadAll(f)
142 if err != nil {
143 b.err = err
144 return b
145 }
146
147 arg := b.state
148 arg.SourceFiles = strings.Split(string(list), "\n")
149 b.fileArgs = append(b.fileArgs, arg)
150 return b
151}
152
153func (b *FileArgsBuilder) Error() error {
154 if b == nil {
155 return nil
156 }
157 return b.err
158}
159
160func (b *FileArgsBuilder) FileArgs() []FileArg {
161 if b == nil {
162 return nil
163 }
164 return b.fileArgs
165}
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700166
167type ZipWriter struct {
Colin Crosse5580972017-08-30 17:40:21 -0700168 time time.Time
169 createdFiles map[string]string
170 createdDirs map[string]string
171 directories bool
Colin Crosse19c7932015-04-24 15:08:38 -0700172
Dan Willemsen017d8932016-08-04 15:43:03 -0700173 errors chan error
174 writeOps chan chan *zipEntry
175
Jeff Gaston175f34c2017-08-17 21:43:21 -0700176 cpuRateLimiter *CPURateLimiter
177 memoryRateLimiter *MemoryRateLimiter
Dan Willemsen017d8932016-08-04 15:43:03 -0700178
179 compressorPool sync.Pool
180 compLevel int
181}
182
// zipEntry is a single entry that is ready to have its header written to the
// zip, together with the (possibly still pending) readers for its contents.
type zipEntry struct {
	// fh is the header written for this entry.
	fh *zip.FileHeader

	// List of delayed io.Reader values that make up the entry's contents, in
	// order. It is left nil for entries without contents (directory entries).
	futureReaders chan chan io.Reader

	// Only used for passing into the MemoryRateLimiter to ensure we
	// release as much memory as we requested.
	allocatedSize int64
}
193
// ZipArgs holds the arguments to Run.
type ZipArgs struct {
	// FileArgs lists the sources to add to the zip.
	FileArgs []FileArg
	// OutputFilePath is the path of the zip to write; Run rejects an empty value.
	OutputFilePath string
	// EmulateJar makes Run add a manifest entry, sort the entries with the jar
	// ordering, and forces AddDirectoryEntriesToZip on.
	EmulateJar bool
	// AddDirectoryEntriesToZip controls whether directory entries are written.
	AddDirectoryEntriesToZip bool
	// CompressionLevel is passed to the flate writers; 0 stores every entry
	// uncompressed.
	CompressionLevel int
	// ManifestSourcePath is the source of the jar manifest; it may only be set
	// together with EmulateJar.
	ManifestSourcePath string
	// NumParallelJobs is passed to the CPU rate limiter.
	NumParallelJobs int
	// NonDeflatedFiles lists destination paths that are stored rather than
	// deflated. Only the presence of a key is checked, not its value.
	NonDeflatedFiles map[string]bool
	// WriteIfChanged builds the zip in memory and writes it with
	// pathtools.WriteFileIfChanged instead of creating the output file up front.
	WriteIfChanged bool
}
Colin Cross2fe66872015-03-30 17:20:39 -0700205
// NOQUOTE is the quote rune used by ReadRespFile to mean "not inside a quoted
// section".
const NOQUOTE = '\x00'

// ReadRespFile splits the contents of a response file into arguments.
//
// Arguments are separated by Unicode whitespace. Single and double quotes
// group text (including whitespace) into one argument and are themselves
// removed. Outside of single quotes a backslash escapes the next character;
// inside double quotes only '"' and '\\' are escapable, and a backslash in
// front of any other character is kept. Inside single quotes a backslash is
// an ordinary character. Empty arguments are dropped.
func ReadRespFile(bytes []byte) []string {
	var (
		args    []string
		current []rune
		escaped bool
	)
	quote := NOQUOTE

	// flush ends the argument being accumulated, emitting it unless it is
	// empty.
	flush := func() {
		if len(current) > 0 {
			args = append(args, string(current))
		}
		current = current[:0]
	}

	for _, c := range string(bytes) {
		if escaped {
			// '\"' or '\\' will be escaped under double quoting; before any
			// other character the backslash is preserved.
			if quote == '"' && c != '"' && c != '\\' {
				current = append(current, '\\')
			}
			current = append(current, c)
			escaped = false
			continue
		}

		inQuotes := quote != NOQUOTE
		switch {
		case c == '\\' && quote != '\'':
			escaped = true
		case !inQuotes && (c == '\'' || c == '"'):
			quote = c
		case inQuotes && c == quote:
			quote = NOQUOTE
		case !inQuotes && unicode.IsSpace(c):
			// Current character is a space outside quotes
			flush()
		default:
			current = append(current, c)
		}
	}

	flush()
	return args
}
248
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700249func Run(args ZipArgs) (err error) {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700250 if args.OutputFilePath == "" {
251 return fmt.Errorf("output file path must be nonempty")
Colin Cross2fe66872015-03-30 17:20:39 -0700252 }
253
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700254 if args.EmulateJar {
255 args.AddDirectoryEntriesToZip = true
Jeff Gaston8edbb3a2017-08-22 20:05:28 -0700256 }
257
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700258 w := &ZipWriter{
Colin Crossc7feeff2018-09-26 21:36:44 +0000259 time: jar.DefaultTime,
260 createdDirs: make(map[string]string),
261 createdFiles: make(map[string]string),
262 directories: args.AddDirectoryEntriesToZip,
263 compLevel: args.CompressionLevel,
Colin Cross2fe66872015-03-30 17:20:39 -0700264 }
Nan Zhang9067b042017-03-17 14:04:43 -0700265 pathMappings := []pathMapping{}
Nan Zhang9067b042017-03-17 14:04:43 -0700266
Colin Crossd3216292018-09-14 15:06:31 -0700267 noCompression := args.CompressionLevel == 0
268
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700269 for _, fa := range args.FileArgs {
Colin Cross7f33b812018-09-26 21:36:22 +0000270 srcs := fa.SourceFiles
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700271 if fa.GlobDir != "" {
Colin Cross7f33b812018-09-26 21:36:22 +0000272 srcs = append(srcs, recursiveGlobFiles(fa.GlobDir)...)
Colin Cross7b10cf12017-08-30 14:12:21 -0700273 }
274 for _, src := range srcs {
Colin Crossb7c69112018-09-18 16:51:43 -0700275 err := fillPathPairs(fa, src, &pathMappings, args.NonDeflatedFiles, noCompression)
Colin Crossd3216292018-09-14 15:06:31 -0700276 if err != nil {
Nan Zhang9067b042017-03-17 14:04:43 -0700277 log.Fatal(err)
278 }
279 }
280 }
281
Colin Crossf83c1502017-11-10 13:11:02 -0800282 buf := &bytes.Buffer{}
283 var out io.Writer = buf
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700284
Colin Crossf83c1502017-11-10 13:11:02 -0800285 if !args.WriteIfChanged {
286 f, err := os.Create(args.OutputFilePath)
287 if err != nil {
288 return err
289 }
290
291 defer f.Close()
292 defer func() {
293 if err != nil {
294 os.Remove(args.OutputFilePath)
295 }
296 }()
297
298 out = f
299 }
300
301 err = w.write(out, pathMappings, args.ManifestSourcePath, args.EmulateJar, args.NumParallelJobs)
302 if err != nil {
303 return err
304 }
305
306 if args.WriteIfChanged {
307 err := pathtools.WriteFileIfChanged(args.OutputFilePath, buf.Bytes(), 0666)
308 if err != nil {
309 return err
310 }
311 }
312
313 return nil
Colin Cross2fe66872015-03-30 17:20:39 -0700314}
315
Colin Crossb7c69112018-09-18 16:51:43 -0700316func fillPathPairs(fa FileArg, src string, pathMappings *[]pathMapping,
Colin Crossd3216292018-09-14 15:06:31 -0700317 nonDeflatedFiles map[string]bool, noCompression bool) error {
318
Nan Zhang9067b042017-03-17 14:04:43 -0700319 src = strings.TrimSpace(src)
320 if src == "" {
321 return nil
322 }
323 src = filepath.Clean(src)
Colin Crossb7c69112018-09-18 16:51:43 -0700324 var dest string
325
326 if fa.JunkPaths {
327 dest = filepath.Base(src)
328 } else {
329 var err error
330 dest, err = filepath.Rel(fa.SourcePrefixToStrip, src)
331 if err != nil {
332 return err
333 }
Nan Zhang9067b042017-03-17 14:04:43 -0700334 }
Colin Crossb7c69112018-09-18 16:51:43 -0700335 dest = filepath.Join(fa.PathPrefixInZip, dest)
Nan Zhang9067b042017-03-17 14:04:43 -0700336
Nan Zhangf281bd82017-04-25 16:47:45 -0700337 zipMethod := zip.Deflate
Colin Crossd3216292018-09-14 15:06:31 -0700338 if _, found := nonDeflatedFiles[dest]; found || noCompression {
Nan Zhangf281bd82017-04-25 16:47:45 -0700339 zipMethod = zip.Store
340 }
341 *pathMappings = append(*pathMappings,
342 pathMapping{dest: dest, src: src, zipMethod: zipMethod})
Nan Zhang9067b042017-03-17 14:04:43 -0700343
344 return nil
345}
346
Jeff Gastona2976952017-08-22 17:51:25 -0700347func jarSort(mappings []pathMapping) {
348 less := func(i int, j int) (smaller bool) {
349 return jar.EntryNamesLess(mappings[i].dest, mappings[j].dest)
350 }
351 sort.SliceStable(mappings, less)
352}
353
// readerSeekerCloser is the set of operations writeFileContents needs from a
// file's contents: sequential reads, reads at an offset, seeking, and closing.
type readerSeekerCloser interface {
	io.Reader
	io.ReaderAt
	io.Closer
	io.Seeker
}
360
Colin Crossf83c1502017-11-10 13:11:02 -0800361func (z *ZipWriter) write(f io.Writer, pathMappings []pathMapping, manifest string, emulateJar bool, parallelJobs int) error {
Dan Willemsen017d8932016-08-04 15:43:03 -0700362 z.errors = make(chan error)
363 defer close(z.errors)
Colin Cross2fe66872015-03-30 17:20:39 -0700364
Dan Willemsen017d8932016-08-04 15:43:03 -0700365 // This channel size can be essentially unlimited -- it's used as a fifo
366 // queue decouple the CPU and IO loads. Directories don't require any
367 // compression time, but still cost some IO. Similar with small files that
368 // can be very fast to compress. Some files that are more difficult to
369 // compress won't take a corresponding longer time writing out.
370 //
371 // The optimum size here depends on your CPU and IO characteristics, and
372 // the the layout of your zip file. 1000 was chosen mostly at random as
373 // something that worked reasonably well for a test file.
374 //
375 // The RateLimit object will put the upper bounds on the number of
376 // parallel compressions and outstanding buffers.
377 z.writeOps = make(chan chan *zipEntry, 1000)
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700378 z.cpuRateLimiter = NewCPURateLimiter(int64(parallelJobs))
Jeff Gaston175f34c2017-08-17 21:43:21 -0700379 z.memoryRateLimiter = NewMemoryRateLimiter(0)
380 defer func() {
381 z.cpuRateLimiter.Stop()
382 z.memoryRateLimiter.Stop()
383 }()
Jeff Gastona2976952017-08-22 17:51:25 -0700384
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700385 if manifest != "" && !emulateJar {
Colin Cross635acc92017-09-12 22:50:46 -0700386 return errors.New("must specify --jar when specifying a manifest via -m")
Jeff Gastona2976952017-08-22 17:51:25 -0700387 }
388
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700389 if emulateJar {
Colin Cross635acc92017-09-12 22:50:46 -0700390 // manifest may be empty, in which case addManifest will fill in a default
391 pathMappings = append(pathMappings, pathMapping{jar.ManifestFile, manifest, zip.Deflate})
392
Jeff Gastona2976952017-08-22 17:51:25 -0700393 jarSort(pathMappings)
394 }
395
Dan Willemsen017d8932016-08-04 15:43:03 -0700396 go func() {
397 var err error
398 defer close(z.writeOps)
399
Nan Zhang9067b042017-03-17 14:04:43 -0700400 for _, ele := range pathMappings {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700401 if emulateJar && ele.dest == jar.ManifestFile {
Jeff Gastoncef50b92017-08-23 15:41:35 -0700402 err = z.addManifest(ele.dest, ele.src, ele.zipMethod)
403 } else {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700404 err = z.addFile(ele.dest, ele.src, ele.zipMethod, emulateJar)
Jeff Gastoncef50b92017-08-23 15:41:35 -0700405 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700406 if err != nil {
407 z.errors <- err
408 return
409 }
410 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700411 }()
412
413 zipw := zip.NewWriter(f)
414
415 var currentWriteOpChan chan *zipEntry
416 var currentWriter io.WriteCloser
417 var currentReaders chan chan io.Reader
418 var currentReader chan io.Reader
419 var done bool
420
421 for !done {
422 var writeOpsChan chan chan *zipEntry
423 var writeOpChan chan *zipEntry
424 var readersChan chan chan io.Reader
425
426 if currentReader != nil {
427 // Only read and process errors
428 } else if currentReaders != nil {
429 readersChan = currentReaders
430 } else if currentWriteOpChan != nil {
431 writeOpChan = currentWriteOpChan
432 } else {
433 writeOpsChan = z.writeOps
434 }
435
436 select {
437 case writeOp, ok := <-writeOpsChan:
438 if !ok {
439 done = true
440 }
441
442 currentWriteOpChan = writeOp
443
444 case op := <-writeOpChan:
445 currentWriteOpChan = nil
446
Colin Crossf83c1502017-11-10 13:11:02 -0800447 var err error
Dan Willemsen017d8932016-08-04 15:43:03 -0700448 if op.fh.Method == zip.Deflate {
449 currentWriter, err = zipw.CreateCompressedHeader(op.fh)
450 } else {
451 var zw io.Writer
Jeff Gastonc5eb66d2017-08-24 14:11:27 -0700452
453 op.fh.CompressedSize64 = op.fh.UncompressedSize64
454
455 zw, err = zipw.CreateHeaderAndroid(op.fh)
Dan Willemsen017d8932016-08-04 15:43:03 -0700456 currentWriter = nopCloser{zw}
457 }
458 if err != nil {
459 return err
460 }
461
462 currentReaders = op.futureReaders
463 if op.futureReaders == nil {
464 currentWriter.Close()
465 currentWriter = nil
466 }
Jeff Gaston175f34c2017-08-17 21:43:21 -0700467 z.memoryRateLimiter.Finish(op.allocatedSize)
Dan Willemsen017d8932016-08-04 15:43:03 -0700468
469 case futureReader, ok := <-readersChan:
470 if !ok {
471 // Done with reading
472 currentWriter.Close()
473 currentWriter = nil
474 currentReaders = nil
475 }
476
477 currentReader = futureReader
478
479 case reader := <-currentReader:
Colin Crossf83c1502017-11-10 13:11:02 -0800480 _, err := io.Copy(currentWriter, reader)
Dan Willemsen017d8932016-08-04 15:43:03 -0700481 if err != nil {
482 return err
483 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700484
485 currentReader = nil
486
Colin Crossf83c1502017-11-10 13:11:02 -0800487 case err := <-z.errors:
Colin Cross2fe66872015-03-30 17:20:39 -0700488 return err
489 }
490 }
491
Dan Willemsen017d8932016-08-04 15:43:03 -0700492 // One last chance to catch an error
493 select {
Colin Crossf83c1502017-11-10 13:11:02 -0800494 case err := <-z.errors:
Dan Willemsen017d8932016-08-04 15:43:03 -0700495 return err
496 default:
497 zipw.Close()
498 return nil
Colin Cross2fe66872015-03-30 17:20:39 -0700499 }
Colin Cross2fe66872015-03-30 17:20:39 -0700500}
501
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700502// imports (possibly with compression) <src> into the zip at sub-path <dest>
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700503func (z *ZipWriter) addFile(dest, src string, method uint16, emulateJar bool) error {
Dan Willemsen017d8932016-08-04 15:43:03 -0700504 var fileSize int64
Dan Willemsen10462b32017-03-15 19:02:51 -0700505 var executable bool
Dan Willemsen017d8932016-08-04 15:43:03 -0700506
Colin Crossc7feeff2018-09-26 21:36:44 +0000507 if s, err := os.Lstat(src); err != nil {
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700508 return err
509 } else if s.IsDir() {
Colin Cross957cc4e2015-04-24 15:10:32 -0700510 if z.directories {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700511 return z.writeDirectory(dest, src, emulateJar)
Colin Cross957cc4e2015-04-24 15:10:32 -0700512 }
513 return nil
Dan Willemsen017d8932016-08-04 15:43:03 -0700514 } else {
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700515 if err := z.writeDirectory(filepath.Dir(dest), src, emulateJar); err != nil {
Colin Crosse5580972017-08-30 17:40:21 -0700516 return err
517 }
518
519 if prev, exists := z.createdDirs[dest]; exists {
520 return fmt.Errorf("destination %q is both a directory %q and a file %q", dest, prev, src)
521 }
522 if prev, exists := z.createdFiles[dest]; exists {
523 return fmt.Errorf("destination %q has two files %q and %q", dest, prev, src)
524 }
525
526 z.createdFiles[dest] = src
527
528 if s.Mode()&os.ModeSymlink != 0 {
529 return z.writeSymlink(dest, src)
530 } else if !s.Mode().IsRegular() {
531 return fmt.Errorf("%s is not a file, directory, or symlink", src)
532 }
533
Dan Willemsen017d8932016-08-04 15:43:03 -0700534 fileSize = s.Size()
Dan Willemsen10462b32017-03-15 19:02:51 -0700535 executable = s.Mode()&0100 != 0
Colin Cross957cc4e2015-04-24 15:10:32 -0700536 }
537
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700538 r, err := os.Open(src)
539 if err != nil {
540 return err
541 }
542
543 header := &zip.FileHeader{
544 Name: dest,
545 Method: method,
546 UncompressedSize64: uint64(fileSize),
547 }
548
549 if executable {
550 header.SetMode(0700)
551 }
552
553 return z.writeFileContents(header, r)
554}
555
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700556func (z *ZipWriter) addManifest(dest string, src string, method uint16) error {
Colin Crosse5580972017-08-30 17:40:21 -0700557 if prev, exists := z.createdDirs[dest]; exists {
558 return fmt.Errorf("destination %q is both a directory %q and a file %q", dest, prev, src)
559 }
560 if prev, exists := z.createdFiles[dest]; exists {
561 return fmt.Errorf("destination %q has two files %q and %q", dest, prev, src)
562 }
563
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700564 if err := z.writeDirectory(filepath.Dir(dest), src, true); err != nil {
Colin Cross635acc92017-09-12 22:50:46 -0700565 return err
Jeff Gastoncef50b92017-08-23 15:41:35 -0700566 }
567
Colin Cross635acc92017-09-12 22:50:46 -0700568 fh, buf, err := jar.ManifestFileContents(src)
569 if err != nil {
570 return err
Jeff Gastoncef50b92017-08-23 15:41:35 -0700571 }
572
Colin Cross635acc92017-09-12 22:50:46 -0700573 reader := &byteReaderCloser{bytes.NewReader(buf), ioutil.NopCloser(nil)}
574
575 return z.writeFileContents(fh, reader)
Jeff Gastoncef50b92017-08-23 15:41:35 -0700576}
577
// writeFileContents queues the entry described by header, with contents read
// from r, for writing. The checksum and compression work is done in
// goroutines started here, which close r once they are finished with it.
//
// Deflated files of at least minParallelFileSize bytes are compressed in
// parallelBlockSize blocks; everything else is handled in one piece by
// compressWholeFile.
//
// NOTE(review): on the early error return inside the block loop, r does not
// appear to be closed and ze.futureReaders is left open — confirm whether
// that matters given that the error aborts the whole zip.
func (z *ZipWriter) writeFileContents(header *zip.FileHeader, r readerSeekerCloser) (err error) {

	header.SetModTime(z.time)

	// Queue the entry's channel before doing any work, so that the entry's
	// position in the zip is fixed by the order of these calls.
	compressChan := make(chan *zipEntry, 1)
	z.writeOps <- compressChan

	// Pre-fill a zipEntry, it will be sent in the compressChan once
	// we're sure about the Method and CRC.
	ze := &zipEntry{
		fh: header,
	}

	ze.allocatedSize = int64(header.UncompressedSize64)
	z.cpuRateLimiter.Request()
	z.memoryRateLimiter.Request(ze.allocatedSize)

	// Fall back to the 32-bit size field if the 64-bit one is not set.
	fileSize := int64(header.UncompressedSize64)
	if fileSize == 0 {
		fileSize = int64(header.UncompressedSize)
	}

	if header.Method == zip.Deflate && fileSize >= minParallelFileSize {
		// wg tracks the CRC goroutine and every block compressor, so that r
		// is only closed after all of them are done.
		wg := new(sync.WaitGroup)

		// Allocate enough buffer to hold all readers. We'll limit
		// this based on actual buffer sizes in RateLimit.
		ze.futureReaders = make(chan chan io.Reader, (fileSize/parallelBlockSize)+1)

		// Calculate the CRC in the background, since reading the entire
		// file could take a while.
		//
		// We could split this up into chunks as well, but it's faster
		// than the compression. Due to the Go Zip API, we also need to
		// know the result before we can begin writing the compressed
		// data out to the zipfile.
		wg.Add(1)
		go z.crcFile(r, ze, compressChan, wg)

		for start := int64(0); start < fileSize; start += parallelBlockSize {
			sr := io.NewSectionReader(r, start, parallelBlockSize)
			resultChan := make(chan io.Reader, 1)
			ze.futureReaders <- resultChan

			z.cpuRateLimiter.Request()

			// The final block is the one that reaches the end of the file.
			last := !(start+parallelBlockSize < fileSize)
			// Every block but the first is primed with the windowSize bytes
			// that precede it as its dictionary.
			var dict []byte
			if start >= windowSize {
				dict, err = ioutil.ReadAll(io.NewSectionReader(r, start-windowSize, windowSize))
				if err != nil {
					return err
				}
			}

			wg.Add(1)
			go z.compressPartialFile(sr, dict, last, resultChan, wg)
		}

		close(ze.futureReaders)

		// Close the file handle after all readers are done
		go func(wg *sync.WaitGroup, closer io.Closer) {
			wg.Wait()
			closer.Close()
		}(wg, r)
	} else {
		go func() {
			z.compressWholeFile(ze, r, compressChan)
			r.Close()
		}()
	}

	return nil
}
653
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700654func (z *ZipWriter) crcFile(r io.Reader, ze *zipEntry, resultChan chan *zipEntry, wg *sync.WaitGroup) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700655 defer wg.Done()
Jeff Gaston175f34c2017-08-17 21:43:21 -0700656 defer z.cpuRateLimiter.Finish()
Dan Willemsen017d8932016-08-04 15:43:03 -0700657
658 crc := crc32.NewIEEE()
659 _, err := io.Copy(crc, r)
660 if err != nil {
661 z.errors <- err
662 return
663 }
664
665 ze.fh.CRC32 = crc.Sum32()
666 resultChan <- ze
667 close(resultChan)
668}
669
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700670func (z *ZipWriter) compressPartialFile(r io.Reader, dict []byte, last bool, resultChan chan io.Reader, wg *sync.WaitGroup) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700671 defer wg.Done()
672
673 result, err := z.compressBlock(r, dict, last)
674 if err != nil {
675 z.errors <- err
676 return
677 }
678
Jeff Gaston175f34c2017-08-17 21:43:21 -0700679 z.cpuRateLimiter.Finish()
680
Dan Willemsen017d8932016-08-04 15:43:03 -0700681 resultChan <- result
682}
683
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700684func (z *ZipWriter) compressBlock(r io.Reader, dict []byte, last bool) (*bytes.Buffer, error) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700685 buf := new(bytes.Buffer)
686 var fw *flate.Writer
687 var err error
688 if len(dict) > 0 {
689 // There's no way to Reset a Writer with a new dictionary, so
690 // don't use the Pool
691 fw, err = flate.NewWriterDict(buf, z.compLevel, dict)
692 } else {
693 var ok bool
694 if fw, ok = z.compressorPool.Get().(*flate.Writer); ok {
695 fw.Reset(buf)
696 } else {
697 fw, err = flate.NewWriter(buf, z.compLevel)
698 }
699 defer z.compressorPool.Put(fw)
700 }
701 if err != nil {
702 return nil, err
703 }
704
705 _, err = io.Copy(fw, r)
706 if err != nil {
707 return nil, err
708 }
709 if last {
710 fw.Close()
711 } else {
712 fw.Flush()
713 }
714
715 return buf, nil
716}
717
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700718func (z *ZipWriter) compressWholeFile(ze *zipEntry, r io.ReadSeeker, compressChan chan *zipEntry) {
Dan Willemsen017d8932016-08-04 15:43:03 -0700719
Dan Willemsen017d8932016-08-04 15:43:03 -0700720 crc := crc32.NewIEEE()
Dan Willemsena8b55022017-03-15 21:49:26 -0700721 _, err := io.Copy(crc, r)
Colin Cross2fe66872015-03-30 17:20:39 -0700722 if err != nil {
Dan Willemsen017d8932016-08-04 15:43:03 -0700723 z.errors <- err
724 return
Colin Cross2fe66872015-03-30 17:20:39 -0700725 }
726
Dan Willemsena8b55022017-03-15 21:49:26 -0700727 ze.fh.CRC32 = crc.Sum32()
Colin Cross2fe66872015-03-30 17:20:39 -0700728
Dan Willemsen017d8932016-08-04 15:43:03 -0700729 _, err = r.Seek(0, 0)
Colin Cross2fe66872015-03-30 17:20:39 -0700730 if err != nil {
Dan Willemsen017d8932016-08-04 15:43:03 -0700731 z.errors <- err
732 return
Colin Cross2fe66872015-03-30 17:20:39 -0700733 }
734
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700735 readFile := func(reader io.ReadSeeker) ([]byte, error) {
736 _, err := reader.Seek(0, 0)
Nan Zhangf281bd82017-04-25 16:47:45 -0700737 if err != nil {
738 return nil, err
739 }
740
Jeff Gaston66dd6e52017-08-23 15:12:48 -0700741 buf, err := ioutil.ReadAll(reader)
Nan Zhangf281bd82017-04-25 16:47:45 -0700742 if err != nil {
743 return nil, err
744 }
745
746 return buf, nil
747 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700748
Dan Willemsena8b55022017-03-15 21:49:26 -0700749 ze.futureReaders = make(chan chan io.Reader, 1)
Dan Willemsen017d8932016-08-04 15:43:03 -0700750 futureReader := make(chan io.Reader, 1)
751 ze.futureReaders <- futureReader
752 close(ze.futureReaders)
753
Nan Zhangf281bd82017-04-25 16:47:45 -0700754 if ze.fh.Method == zip.Deflate {
755 compressed, err := z.compressBlock(r, nil, true)
756 if err != nil {
757 z.errors <- err
758 return
759 }
760 if uint64(compressed.Len()) < ze.fh.UncompressedSize64 {
761 futureReader <- compressed
Nan Zhangf281bd82017-04-25 16:47:45 -0700762 } else {
763 buf, err := readFile(r)
764 if err != nil {
765 z.errors <- err
766 return
767 }
768 ze.fh.Method = zip.Store
769 futureReader <- bytes.NewReader(buf)
Nan Zhangf281bd82017-04-25 16:47:45 -0700770 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700771 } else {
Nan Zhangf281bd82017-04-25 16:47:45 -0700772 buf, err := readFile(r)
Dan Willemsen017d8932016-08-04 15:43:03 -0700773 if err != nil {
774 z.errors <- err
775 return
776 }
Dan Willemsen017d8932016-08-04 15:43:03 -0700777 ze.fh.Method = zip.Store
778 futureReader <- bytes.NewReader(buf)
Dan Willemsen017d8932016-08-04 15:43:03 -0700779 }
Nan Zhangf281bd82017-04-25 16:47:45 -0700780
Jeff Gaston175f34c2017-08-17 21:43:21 -0700781 z.cpuRateLimiter.Finish()
782
Dan Willemsen017d8932016-08-04 15:43:03 -0700783 close(futureReader)
784
785 compressChan <- ze
786 close(compressChan)
Colin Cross2fe66872015-03-30 17:20:39 -0700787}
Colin Crosse19c7932015-04-24 15:08:38 -0700788
Colin Crosse5580972017-08-30 17:40:21 -0700789// writeDirectory annotates that dir is a directory created for the src file or directory, and adds
790// the directory entry to the zip file if directories are enabled.
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700791func (z *ZipWriter) writeDirectory(dir string, src string, emulateJar bool) error {
Jeff Gaston2d174132017-08-15 18:05:56 -0700792 // clean the input
Colin Crosse5580972017-08-30 17:40:21 -0700793 dir = filepath.Clean(dir)
Jeff Gaston2d174132017-08-15 18:05:56 -0700794
795 // discover any uncreated directories in the path
796 zipDirs := []string{}
Colin Crosse5580972017-08-30 17:40:21 -0700797 for dir != "" && dir != "." {
798 if _, exists := z.createdDirs[dir]; exists {
799 break
800 }
Jeff Gaston2d174132017-08-15 18:05:56 -0700801
Colin Crosse5580972017-08-30 17:40:21 -0700802 if prev, exists := z.createdFiles[dir]; exists {
803 return fmt.Errorf("destination %q is both a directory %q and a file %q", dir, src, prev)
804 }
805
806 z.createdDirs[dir] = src
Jeff Gaston2d174132017-08-15 18:05:56 -0700807 // parent directories precede their children
Colin Crosse5580972017-08-30 17:40:21 -0700808 zipDirs = append([]string{dir}, zipDirs...)
Jeff Gaston2d174132017-08-15 18:05:56 -0700809
Colin Crosse5580972017-08-30 17:40:21 -0700810 dir = filepath.Dir(dir)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700811 }
812
Colin Crosse5580972017-08-30 17:40:21 -0700813 if z.directories {
814 // make a directory entry for each uncreated directory
815 for _, cleanDir := range zipDirs {
Colin Cross635acc92017-09-12 22:50:46 -0700816 var dirHeader *zip.FileHeader
Colin Crosse19c7932015-04-24 15:08:38 -0700817
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700818 if emulateJar && cleanDir+"/" == jar.MetaDir {
Colin Cross635acc92017-09-12 22:50:46 -0700819 dirHeader = jar.MetaDirFileHeader()
820 } else {
821 dirHeader = &zip.FileHeader{
822 Name: cleanDir + "/",
823 }
824 dirHeader.SetMode(0700 | os.ModeDir)
Colin Crosse5580972017-08-30 17:40:21 -0700825 }
Jeff Gaston8edbb3a2017-08-22 20:05:28 -0700826
Colin Cross635acc92017-09-12 22:50:46 -0700827 dirHeader.SetModTime(z.time)
828
Colin Crosse5580972017-08-30 17:40:21 -0700829 ze := make(chan *zipEntry, 1)
830 ze <- &zipEntry{
831 fh: dirHeader,
832 }
833 close(ze)
834 z.writeOps <- ze
Colin Crosse19c7932015-04-24 15:08:38 -0700835 }
Colin Crosse19c7932015-04-24 15:08:38 -0700836 }
837
838 return nil
839}
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700840
Jeff Gastonc3bdc972017-10-12 12:18:19 -0700841func (z *ZipWriter) writeSymlink(rel, file string) error {
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700842 fileHeader := &zip.FileHeader{
843 Name: rel,
844 }
845 fileHeader.SetModTime(z.time)
Colin Cross297d9bc2018-06-22 16:37:47 -0700846 fileHeader.SetMode(0777 | os.ModeSymlink)
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700847
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700848 dest, err := os.Readlink(file)
849 if err != nil {
850 return err
851 }
852
Colin Cross297d9bc2018-06-22 16:37:47 -0700853 fileHeader.UncompressedSize64 = uint64(len(dest))
854 fileHeader.CRC32 = crc32.ChecksumIEEE([]byte(dest))
855
Dan Willemsen017d8932016-08-04 15:43:03 -0700856 ze := make(chan *zipEntry, 1)
857 futureReaders := make(chan chan io.Reader, 1)
858 futureReader := make(chan io.Reader, 1)
859 futureReaders <- futureReader
860 close(futureReaders)
861 futureReader <- bytes.NewBufferString(dest)
862 close(futureReader)
863
Dan Willemsen017d8932016-08-04 15:43:03 -0700864 ze <- &zipEntry{
865 fh: fileHeader,
866 futureReaders: futureReaders,
867 }
868 close(ze)
869 z.writeOps <- ze
870
871 return nil
Dan Willemsena59a3bc2016-08-03 17:47:23 -0700872}
Colin Cross7b10cf12017-08-30 14:12:21 -0700873
// recursiveGlobFiles returns the paths of all non-directory entries found by
// walking the file tree rooted at path.
//
// Entries that cannot be examined (for example a root that does not exist, or
// a directory that cannot be read) are logged and skipped; they never cause a
// panic.
func recursiveGlobFiles(path string) []string {
	var files []string
	filepath.Walk(path, func(p string, info os.FileInfo, err error) error {
		if err != nil {
			// info may be nil here, so it must not be inspected. Returning
			// nil lets the walk continue with the remaining entries.
			log.Printf("skipping %q: %v", p, err)
			return nil
		}
		if !info.IsDir() {
			files = append(files, p)
		}
		return nil
	})

	return files
}