Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 1 | // Copyright 2017 Google Inc. All rights reserved. |
| 2 | // |
| 3 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 | // you may not use this file except in compliance with the License. |
| 5 | // You may obtain a copy of the License at |
| 6 | // |
| 7 | // http://www.apache.org/licenses/LICENSE-2.0 |
| 8 | // |
| 9 | // Unless required by applicable law or agreed to in writing, software |
| 10 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 11 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 12 | // See the License for the specific language governing permissions and |
| 13 | // limitations under the License. |
| 14 | |
| 15 | package main |
| 16 | |
| 17 | import ( |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 18 | "errors" |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 19 | "flag" |
| 20 | "fmt" |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 21 | "hash/crc32" |
Dan Willemsen | 263dde7 | 2018-11-15 19:15:02 -0800 | [diff] [blame] | 22 | "io" |
Nan Zhang | 5925b0f | 2017-12-19 15:13:40 -0800 | [diff] [blame] | 23 | "io/ioutil" |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 24 | "log" |
| 25 | "os" |
Nan Zhang | 13f4cf5 | 2017-09-19 18:42:01 -0700 | [diff] [blame] | 26 | "path/filepath" |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 27 | "sort" |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 28 | |
| 29 | "github.com/google/blueprint/pathtools" |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 30 | |
| 31 | "android/soong/jar" |
| 32 | "android/soong/third_party/zip" |
| 33 | ) |
| 34 | |
// fileList collects the values of a command-line flag that may be given more
// than once. It is registered with the flag package through flag.Var.
type fileList []string

// String always reports the literal two-character text `""`, independent of
// the current contents of the list.
func (f *fileList) String() string {
	const placeholder = `""`
	return placeholder
}

// Set normalizes name with filepath.Clean and appends the result to the list.
// It never returns an error.
func (f *fileList) Set(name string) error {
	cleaned := filepath.Clean(name)
	*f = append(*f, cleaned)
	return nil
}
| 46 | |
// zipsToNotStripSet is a set of input zip paths, filled in one path per
// occurrence of the flag it is registered under via flag.Var.
type zipsToNotStripSet map[string]bool

// String always reports the literal two-character text `""`, independent of
// the current contents of the set.
func (s zipsToNotStripSet) String() string {
	const placeholder = `""`
	return placeholder
}

// Set records zipPath, exactly as given, as a member of the set. It never
// returns an error.
func (s zipsToNotStripSet) Set(zipPath string) error {
	s[zipPath] = true
	return nil
}
| 58 | |
// Command-line options. The pointer-valued entries are registered with the
// flag package right here; stripDirs, stripFiles and zipsToNotStrip are
// repeatable options whose flag names are bound in init via flag.Var.
var (
	sortEntries      = flag.Bool("s", false, "sort entries (defaults to the order from the input zip files)")
	emulateJar       = flag.Bool("j", false, "sort zip entries using jar ordering (META-INF first)")
	emulatePar       = flag.Bool("p", false, "merge zip entries based on par format")
	stripDirs        fileList
	stripFiles       fileList
	zipsToNotStrip   = make(zipsToNotStripSet)
	stripDirEntries  = flag.Bool("D", false, "strip directory entries from the output zip file")
	manifest         = flag.String("m", "", "manifest file to insert in jar")
	pyMain           = flag.String("pm", "", "__main__.py file to insert in par")
	entrypoint       = flag.String("e", "", "par entrypoint file to insert in par")
	prefix           = flag.String("prefix", "", "A file to prefix to the zip file")
	ignoreDuplicates = flag.Bool("ignore-duplicates", false, "take each entry from the first zip it exists in and don't warn")
)
| 73 | |
Nan Zhang | d5998cc | 2017-09-13 13:17:43 -0700 | [diff] [blame] | 74 | func init() { |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 75 | flag.Var(&stripDirs, "stripDir", "directories to be excluded from the output zip, accepts wildcards") |
| 76 | flag.Var(&stripFiles, "stripFile", "files to be excluded from the output zip, accepts wildcards") |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 77 | flag.Var(&zipsToNotStrip, "zipToNotStrip", "the input zip file which is not applicable for stripping") |
Nan Zhang | d5998cc | 2017-09-13 13:17:43 -0700 | [diff] [blame] | 78 | } |
| 79 | |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 80 | func main() { |
| 81 | flag.Usage = func() { |
Dan Willemsen | 263dde7 | 2018-11-15 19:15:02 -0800 | [diff] [blame] | 82 | fmt.Fprintln(os.Stderr, "usage: merge_zips [-jpsD] [-m manifest] [--prefix script] [-e entrypoint] [-pm __main__.py] output [inputs...]") |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 83 | flag.PrintDefaults() |
| 84 | } |
| 85 | |
| 86 | // parse args |
| 87 | flag.Parse() |
| 88 | args := flag.Args() |
Colin Cross | 5c6ecc1 | 2017-10-23 18:12:27 -0700 | [diff] [blame] | 89 | if len(args) < 1 { |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 90 | flag.Usage() |
| 91 | os.Exit(1) |
| 92 | } |
| 93 | outputPath := args[0] |
| 94 | inputs := args[1:] |
| 95 | |
| 96 | log.SetFlags(log.Lshortfile) |
| 97 | |
| 98 | // make writer |
| 99 | output, err := os.Create(outputPath) |
| 100 | if err != nil { |
| 101 | log.Fatal(err) |
| 102 | } |
| 103 | defer output.Close() |
Dan Willemsen | 263dde7 | 2018-11-15 19:15:02 -0800 | [diff] [blame] | 104 | |
| 105 | var offset int64 |
| 106 | if *prefix != "" { |
| 107 | prefixFile, err := os.Open(*prefix) |
| 108 | if err != nil { |
| 109 | log.Fatal(err) |
| 110 | } |
| 111 | offset, err = io.Copy(output, prefixFile) |
| 112 | if err != nil { |
| 113 | log.Fatal(err) |
| 114 | } |
| 115 | } |
| 116 | |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 117 | writer := zip.NewWriter(output) |
| 118 | defer func() { |
| 119 | err := writer.Close() |
| 120 | if err != nil { |
| 121 | log.Fatal(err) |
| 122 | } |
| 123 | }() |
Dan Willemsen | 263dde7 | 2018-11-15 19:15:02 -0800 | [diff] [blame] | 124 | writer.SetOffset(offset) |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 125 | |
| 126 | // make readers |
| 127 | readers := []namedZipReader{} |
| 128 | for _, input := range inputs { |
| 129 | reader, err := zip.OpenReader(input) |
| 130 | if err != nil { |
| 131 | log.Fatal(err) |
| 132 | } |
| 133 | defer reader.Close() |
Colin Cross | 2486065 | 2018-07-14 22:19:14 -0700 | [diff] [blame] | 134 | namedReader := namedZipReader{path: input, reader: &reader.Reader} |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 135 | readers = append(readers, namedReader) |
| 136 | } |
| 137 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 138 | if *manifest != "" && !*emulateJar { |
| 139 | log.Fatal(errors.New("must specify -j when specifying a manifest via -m")) |
| 140 | } |
| 141 | |
Nan Zhang | 5925b0f | 2017-12-19 15:13:40 -0800 | [diff] [blame] | 142 | if *entrypoint != "" && !*emulatePar { |
| 143 | log.Fatal(errors.New("must specify -p when specifying a entrypoint via -e")) |
| 144 | } |
| 145 | |
Nan Zhang | 1db8540 | 2017-12-18 13:20:23 -0800 | [diff] [blame] | 146 | if *pyMain != "" && !*emulatePar { |
| 147 | log.Fatal(errors.New("must specify -p when specifying a Python __main__.py via -pm")) |
| 148 | } |
| 149 | |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 150 | // do merge |
Nan Zhang | 1db8540 | 2017-12-18 13:20:23 -0800 | [diff] [blame] | 151 | err = mergeZips(readers, writer, *manifest, *entrypoint, *pyMain, *sortEntries, *emulateJar, *emulatePar, |
Colin Cross | 2486065 | 2018-07-14 22:19:14 -0700 | [diff] [blame] | 152 | *stripDirEntries, *ignoreDuplicates, []string(stripFiles), []string(stripDirs), map[string]bool(zipsToNotStrip)) |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 153 | if err != nil { |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 154 | log.Fatal(err) |
| 155 | } |
| 156 | } |
| 157 | |
// a namedZipReader reads a .zip file and can say which file it's reading
type namedZipReader struct {
	// path is the location of the zip file; main sets it to the input path
	// exactly as given on the command line.
	path string
	// reader gives access to the entries of the zip file at path.
	reader *zip.Reader
}
| 163 | |
// a zipEntryPath identifies one entry inside one zip file
type zipEntryPath struct {
	zipName   string // name of the containing zip file
	entryName string // name of the entry within that zip
}

// String renders the path as the zip name and the entry name joined by "/".
func (p zipEntryPath) String() string {
	return fmt.Sprintf("%s/%s", p.zipName, p.entryName)
}
| 173 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 174 | // a zipEntry is a zipSource that pulls its content from another zip |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 175 | type zipEntry struct { |
| 176 | path zipEntryPath |
| 177 | content *zip.File |
| 178 | } |
| 179 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 180 | func (ze zipEntry) String() string { |
| 181 | return ze.path.String() |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 182 | } |
| 183 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 184 | func (ze zipEntry) IsDir() bool { |
| 185 | return ze.content.FileInfo().IsDir() |
| 186 | } |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 187 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 188 | func (ze zipEntry) CRC32() uint32 { |
| 189 | return ze.content.FileHeader.CRC32 |
| 190 | } |
| 191 | |
Colin Cross | dc1e829 | 2018-10-17 15:05:56 -0700 | [diff] [blame] | 192 | func (ze zipEntry) Size() uint64 { |
| 193 | return ze.content.FileHeader.UncompressedSize64 |
| 194 | } |
| 195 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 196 | func (ze zipEntry) WriteToZip(dest string, zw *zip.Writer) error { |
| 197 | return zw.CopyFrom(ze.content, dest) |
| 198 | } |
| 199 | |
| 200 | // a bufferEntry is a zipSource that pulls its content from a []byte |
| 201 | type bufferEntry struct { |
| 202 | fh *zip.FileHeader |
| 203 | content []byte |
| 204 | } |
| 205 | |
| 206 | func (be bufferEntry) String() string { |
| 207 | return "internal buffer" |
| 208 | } |
| 209 | |
| 210 | func (be bufferEntry) IsDir() bool { |
| 211 | return be.fh.FileInfo().IsDir() |
| 212 | } |
| 213 | |
| 214 | func (be bufferEntry) CRC32() uint32 { |
| 215 | return crc32.ChecksumIEEE(be.content) |
| 216 | } |
| 217 | |
Colin Cross | dc1e829 | 2018-10-17 15:05:56 -0700 | [diff] [blame] | 218 | func (be bufferEntry) Size() uint64 { |
| 219 | return uint64(len(be.content)) |
| 220 | } |
| 221 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 222 | func (be bufferEntry) WriteToZip(dest string, zw *zip.Writer) error { |
| 223 | w, err := zw.CreateHeader(be.fh) |
| 224 | if err != nil { |
| 225 | return err |
| 226 | } |
| 227 | |
| 228 | if !be.IsDir() { |
| 229 | _, err = w.Write(be.content) |
| 230 | if err != nil { |
| 231 | return err |
| 232 | } |
| 233 | } |
| 234 | |
| 235 | return nil |
| 236 | } |
| 237 | |
// a zipSource is something that can be written into the output zip as a single
// entry; it is implemented by zipEntry and bufferEntry
type zipSource interface {
	// String describes where the entry comes from; it is used in error messages.
	String() string
	// IsDir reports whether the entry is a directory.
	IsDir() bool
	// CRC32 and Size are compared by mergeZips to decide whether two entries
	// destined for the same path can be treated as identical.
	CRC32() uint32
	Size() uint64
	// WriteToZip writes the entry into zw; dest is the destination path that
	// mergeZips recorded for the entry.
	WriteToZip(dest string, zw *zip.Writer) error
}
| 245 | |
// a fileMapping specifies to copy a zip entry from one place to another
type fileMapping struct {
	// dest is the path of the entry in the output zip.
	dest string
	// source supplies the entry that is written to dest.
	source zipSource
}
| 251 | |
Nan Zhang | 1db8540 | 2017-12-18 13:20:23 -0800 | [diff] [blame] | 252 | func mergeZips(readers []namedZipReader, writer *zip.Writer, manifest, entrypoint, pyMain string, |
Colin Cross | 2486065 | 2018-07-14 22:19:14 -0700 | [diff] [blame] | 253 | sortEntries, emulateJar, emulatePar, stripDirEntries, ignoreDuplicates bool, |
| 254 | stripFiles, stripDirs []string, zipsToNotStrip map[string]bool) error { |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 255 | |
| 256 | sourceByDest := make(map[string]zipSource, 0) |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 257 | orderedMappings := []fileMapping{} |
| 258 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 259 | // if dest already exists returns a non-null zipSource for the existing source |
| 260 | addMapping := func(dest string, source zipSource) zipSource { |
| 261 | mapKey := filepath.Clean(dest) |
| 262 | if existingSource, exists := sourceByDest[mapKey]; exists { |
| 263 | return existingSource |
| 264 | } |
| 265 | |
| 266 | sourceByDest[mapKey] = source |
| 267 | orderedMappings = append(orderedMappings, fileMapping{source: source, dest: dest}) |
| 268 | return nil |
| 269 | } |
| 270 | |
| 271 | if manifest != "" { |
| 272 | if !stripDirEntries { |
| 273 | dirHeader := jar.MetaDirFileHeader() |
| 274 | dirSource := bufferEntry{dirHeader, nil} |
| 275 | addMapping(jar.MetaDir, dirSource) |
| 276 | } |
| 277 | |
Colin Cross | 05518bc | 2018-09-27 15:06:19 -0700 | [diff] [blame] | 278 | contents, err := ioutil.ReadFile(manifest) |
| 279 | if err != nil { |
| 280 | return err |
| 281 | } |
| 282 | |
| 283 | fh, buf, err := jar.ManifestFileContents(contents) |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 284 | if err != nil { |
| 285 | return err |
| 286 | } |
| 287 | |
| 288 | fileSource := bufferEntry{fh, buf} |
| 289 | addMapping(jar.ManifestFile, fileSource) |
| 290 | } |
| 291 | |
Nan Zhang | 5925b0f | 2017-12-19 15:13:40 -0800 | [diff] [blame] | 292 | if entrypoint != "" { |
| 293 | buf, err := ioutil.ReadFile(entrypoint) |
| 294 | if err != nil { |
| 295 | return err |
| 296 | } |
| 297 | fh := &zip.FileHeader{ |
| 298 | Name: "entry_point.txt", |
| 299 | Method: zip.Store, |
| 300 | UncompressedSize64: uint64(len(buf)), |
| 301 | } |
| 302 | fh.SetMode(0700) |
| 303 | fh.SetModTime(jar.DefaultTime) |
| 304 | fileSource := bufferEntry{fh, buf} |
| 305 | addMapping("entry_point.txt", fileSource) |
| 306 | } |
| 307 | |
Nan Zhang | 1db8540 | 2017-12-18 13:20:23 -0800 | [diff] [blame] | 308 | if pyMain != "" { |
| 309 | buf, err := ioutil.ReadFile(pyMain) |
| 310 | if err != nil { |
| 311 | return err |
| 312 | } |
| 313 | fh := &zip.FileHeader{ |
| 314 | Name: "__main__.py", |
| 315 | Method: zip.Store, |
| 316 | UncompressedSize64: uint64(len(buf)), |
| 317 | } |
| 318 | fh.SetMode(0700) |
| 319 | fh.SetModTime(jar.DefaultTime) |
| 320 | fileSource := bufferEntry{fh, buf} |
| 321 | addMapping("__main__.py", fileSource) |
| 322 | } |
| 323 | |
Nan Zhang | 5925b0f | 2017-12-19 15:13:40 -0800 | [diff] [blame] | 324 | if emulatePar { |
| 325 | // the runfiles packages needs to be populated with "__init__.py". |
| 326 | newPyPkgs := []string{} |
| 327 | // the runfiles dirs have been treated as packages. |
| 328 | existingPyPkgSet := make(map[string]bool) |
| 329 | // put existing __init__.py files to a set first. This set is used for preventing |
| 330 | // generated __init__.py files from overwriting existing ones. |
| 331 | for _, namedReader := range readers { |
| 332 | for _, file := range namedReader.reader.File { |
| 333 | if filepath.Base(file.Name) != "__init__.py" { |
| 334 | continue |
| 335 | } |
| 336 | pyPkg := pathBeforeLastSlash(file.Name) |
| 337 | if _, found := existingPyPkgSet[pyPkg]; found { |
| 338 | panic(fmt.Errorf("found __init__.py path duplicates during pars merging: %q.", file.Name)) |
| 339 | } else { |
| 340 | existingPyPkgSet[pyPkg] = true |
| 341 | } |
| 342 | } |
| 343 | } |
| 344 | for _, namedReader := range readers { |
| 345 | for _, file := range namedReader.reader.File { |
| 346 | var parentPath string /* the path after trimming last "/" */ |
| 347 | if filepath.Base(file.Name) == "__init__.py" { |
| 348 | // for existing __init__.py files, we should trim last "/" for twice. |
| 349 | // eg. a/b/c/__init__.py ---> a/b |
| 350 | parentPath = pathBeforeLastSlash(pathBeforeLastSlash(file.Name)) |
| 351 | } else { |
| 352 | parentPath = pathBeforeLastSlash(file.Name) |
| 353 | } |
| 354 | populateNewPyPkgs(parentPath, existingPyPkgSet, &newPyPkgs) |
| 355 | } |
| 356 | } |
| 357 | for _, pkg := range newPyPkgs { |
| 358 | var emptyBuf []byte |
| 359 | fh := &zip.FileHeader{ |
| 360 | Name: filepath.Join(pkg, "__init__.py"), |
| 361 | Method: zip.Store, |
| 362 | UncompressedSize64: uint64(len(emptyBuf)), |
| 363 | } |
| 364 | fh.SetMode(0700) |
| 365 | fh.SetModTime(jar.DefaultTime) |
| 366 | fileSource := bufferEntry{fh, emptyBuf} |
| 367 | addMapping(filepath.Join(pkg, "__init__.py"), fileSource) |
| 368 | } |
| 369 | } |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 370 | for _, namedReader := range readers { |
Nan Zhang | 13f4cf5 | 2017-09-19 18:42:01 -0700 | [diff] [blame] | 371 | _, skipStripThisZip := zipsToNotStrip[namedReader.path] |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 372 | for _, file := range namedReader.reader.File { |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 373 | if !skipStripThisZip { |
| 374 | if skip, err := shouldStripEntry(emulateJar, stripFiles, stripDirs, file.Name); err != nil { |
| 375 | return err |
| 376 | } else if skip { |
| 377 | continue |
| 378 | } |
Nan Zhang | d5998cc | 2017-09-13 13:17:43 -0700 | [diff] [blame] | 379 | } |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 380 | |
| 381 | if stripDirEntries && file.FileInfo().IsDir() { |
| 382 | continue |
| 383 | } |
| 384 | |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 385 | // check for other files or directories destined for the same path |
| 386 | dest := file.Name |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 387 | |
| 388 | // make a new entry to add |
| 389 | source := zipEntry{path: zipEntryPath{zipName: namedReader.path, entryName: file.Name}, content: file} |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 390 | |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 391 | if existingSource := addMapping(dest, source); existingSource != nil { |
Colin Cross | 3454031 | 2017-09-06 12:52:37 -0700 | [diff] [blame] | 392 | // handle duplicates |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 393 | if existingSource.IsDir() != source.IsDir() { |
Colin Cross | 3454031 | 2017-09-06 12:52:37 -0700 | [diff] [blame] | 394 | return fmt.Errorf("Directory/file mismatch at %v from %v and %v\n", |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 395 | dest, existingSource, source) |
Colin Cross | 3454031 | 2017-09-06 12:52:37 -0700 | [diff] [blame] | 396 | } |
Colin Cross | dc1e829 | 2018-10-17 15:05:56 -0700 | [diff] [blame] | 397 | |
Colin Cross | e909e1e | 2017-11-22 14:09:40 -0800 | [diff] [blame] | 398 | if ignoreDuplicates { |
| 399 | continue |
| 400 | } |
Colin Cross | dc1e829 | 2018-10-17 15:05:56 -0700 | [diff] [blame] | 401 | |
Colin Cross | 3454031 | 2017-09-06 12:52:37 -0700 | [diff] [blame] | 402 | if emulateJar && |
| 403 | file.Name == jar.ManifestFile || file.Name == jar.ModuleInfoClass { |
| 404 | // Skip manifest and module info files that are not from the first input file |
| 405 | continue |
| 406 | } |
Colin Cross | dc1e829 | 2018-10-17 15:05:56 -0700 | [diff] [blame] | 407 | |
| 408 | if source.IsDir() { |
| 409 | continue |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 410 | } |
Colin Cross | dc1e829 | 2018-10-17 15:05:56 -0700 | [diff] [blame] | 411 | |
| 412 | if existingSource.CRC32() == source.CRC32() && existingSource.Size() == source.Size() { |
| 413 | continue |
| 414 | } |
| 415 | |
| 416 | return fmt.Errorf("Duplicate path %v found in %v and %v\n", |
| 417 | dest, existingSource, source) |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 418 | } |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 419 | } |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 420 | } |
| 421 | |
Colin Cross | 3454031 | 2017-09-06 12:52:37 -0700 | [diff] [blame] | 422 | if emulateJar { |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 423 | jarSort(orderedMappings) |
| 424 | } else if sortEntries { |
| 425 | alphanumericSort(orderedMappings) |
| 426 | } |
| 427 | |
| 428 | for _, entry := range orderedMappings { |
Colin Cross | 635acc9 | 2017-09-12 22:50:46 -0700 | [diff] [blame] | 429 | if err := entry.source.WriteToZip(entry.dest, writer); err != nil { |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 430 | return err |
| 431 | } |
| 432 | } |
| 433 | |
| 434 | return nil |
| 435 | } |
| 436 | |
// populateNewPyPkgs walks from pkgPath up through its ancestor directories and
// registers each one as a Python package: it is added as a key of
// existingPyPkgSet and appended to *newPyPkgs. The walk stops at the first
// directory that is already a key of existingPyPkgSet (whatever its value), or
// once the path has no parent left.
func populateNewPyPkgs(pkgPath string, existingPyPkgSet map[string]bool, newPyPkgs *[]string) {
	for dir := pkgPath; dir != ""; {
		if _, known := existingPyPkgSet[dir]; known {
			return
		}
		existingPyPkgSet[dir] = true
		*newPyPkgs = append(*newPyPkgs, dir)

		// Step to the parent directory; filepath.Dir yields "." or "/" once
		// there is nothing left to trim, which ends the walk.
		parent := filepath.Dir(dir)
		if parent == "." || parent == "/" {
			parent = ""
		}
		dir = parent
	}
}
| 450 | |
// pathBeforeLastSlash returns the directory part of path as computed by
// filepath.Dir, or "" when that directory is "." or "/"
// (e.g. "abc" and "/abc" both yield "").
func pathBeforeLastSlash(path string) string {
	switch dir := filepath.Dir(path); dir {
	case ".", "/":
		return ""
	default:
		return dir
	}
}
| 459 | |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 460 | func shouldStripEntry(emulateJar bool, stripFiles, stripDirs []string, name string) (bool, error) { |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 461 | for _, dir := range stripDirs { |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 462 | dir = filepath.Clean(dir) |
| 463 | patterns := []string{ |
| 464 | dir + "/", // the directory itself |
| 465 | dir + "/**/*", // files recursively in the directory |
| 466 | dir + "/**/*/", // directories recursively in the directory |
| 467 | } |
| 468 | |
| 469 | for _, pattern := range patterns { |
| 470 | match, err := pathtools.Match(pattern, name) |
| 471 | if err != nil { |
| 472 | return false, fmt.Errorf("%s: %s", err.Error(), pattern) |
| 473 | } else if match { |
| 474 | if emulateJar { |
| 475 | // When merging jar files, don't strip META-INF/MANIFEST.MF even if stripping META-INF is |
| 476 | // requested. |
| 477 | // TODO(ccross): which files does this affect? |
| 478 | if name != jar.MetaDir && name != jar.ManifestFile { |
| 479 | return true, nil |
| 480 | } |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 481 | } |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 482 | return true, nil |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 483 | } |
| 484 | } |
| 485 | } |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 486 | |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 487 | for _, pattern := range stripFiles { |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 488 | if match, err := pathtools.Match(pattern, name); err != nil { |
| 489 | return false, fmt.Errorf("%s: %s", err.Error(), pattern) |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 490 | } else if match { |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 491 | return true, nil |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 492 | } |
| 493 | } |
Colin Cross | 4c03f68 | 2018-07-15 08:16:31 -0700 | [diff] [blame] | 494 | return false, nil |
Colin Cross | 0cf45cd | 2017-10-04 17:04:16 -0700 | [diff] [blame] | 495 | } |
| 496 | |
Jeff Gaston | 8bab5f2 | 2017-09-01 13:34:28 -0700 | [diff] [blame] | 497 | func jarSort(files []fileMapping) { |
| 498 | sort.SliceStable(files, func(i, j int) bool { |
| 499 | return jar.EntryNamesLess(files[i].dest, files[j].dest) |
| 500 | }) |
| 501 | } |
| 502 | |
| 503 | func alphanumericSort(files []fileMapping) { |
| 504 | sort.SliceStable(files, func(i, j int) bool { |
| 505 | return files[i].dest < files[j].dest |
| 506 | }) |
| 507 | } |