// Copyright 2015 The Bazel Authors. All rights reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // // Zip / Unzip file using ijar zip implementation. // // Note that this Zip implementation intentionally don't compute CRC-32 // because it is useless computation for jar because Java doesn't care. // CRC-32 of all files in the zip file will be set to 0. // #include #include #include #include #include #include #include #include #include #include #include #include "third_party/ijar/zip.h" namespace devtools_ijar { #define SYSCALL(expr) do { \ if ((expr) < 0) { \ perror(#expr); \ abort(); \ } \ } while (0) // // A ZipExtractorProcessor that extract files in the ZIP file. // class UnzipProcessor : public ZipExtractorProcessor { public: // Create a processor who will extract the given files (or all files if NULL) // into output_root if "extract" is set to true and will print the list of // files and their unix modes if "verbose" is set to true. UnzipProcessor(const char *output_root, char **files, bool verbose, bool extract) : output_root_(output_root), verbose_(verbose), extract_(extract) { if (files != NULL) { for (int i = 0; files[i] != NULL; i++) { file_names.insert(std::string(files[i])); } } } virtual ~UnzipProcessor() {} virtual void Process(const char* filename, const u4 attr, const u1* data, const size_t size); virtual bool Accept(const char* filename, const u4 attr) { // All entry files are accepted by default. if (file_names.empty()) { return true; } else { // If users have specified file entries, only accept those files. return file_names.count(std::string(filename)) == 1; } } private: const char *output_root_; const bool verbose_; const bool extract_; std::set file_names; }; // Concatene 2 path, path1 and path2, using / as a directory separator and // puting the result in "out". "size" specify the size of the output buffer void concat_path(char* out, const size_t size, const char *path1, const char *path2) { int len1 = strlen(path1); size_t l = len1; strncpy(out, path1, size - 1); out[size-1] = 0; if (l < size - 1 && path1[len1] != '/' && path2[0] != '/') { out[l] = '/'; l++; out[l] = 0; } if (l < size - 1) { strncat(out, path2, size - 1 - l); } } // Do a recursive mkdir of all folders of path except the last path // segment (if path ends with a / then the last path segment is empty). // All folders are created using "mode" for creation mode. void mkdirs(const char *path, mode_t mode) { char path_[PATH_MAX]; struct stat statst; strncpy(path_, path, PATH_MAX); path_[PATH_MAX-1] = 0; char *pointer = path_; while ((pointer = strchr(pointer, '/')) != NULL) { if (path_ != pointer) { // skip leading slash *pointer = 0; if (stat(path_, &statst) != 0) { if (mkdir(path_, mode) < 0) { fprintf(stderr, "Cannot create folder %s: %s\n", path_, strerror(errno)); abort(); } } *pointer = '/'; } pointer++; } } void UnzipProcessor::Process(const char* filename, const u4 attr, const u1* data, const size_t size) { mode_t mode = zipattr_to_mode(attr); mode_t perm = mode & 0777; bool isdir = (mode & S_IFDIR) != 0; if (attr == 0) { // Fallback when the external attribute is not set. isdir = filename[strlen(filename)-1] == '/'; perm = 0777; } if (verbose_) { printf("%c %o %s\n", isdir ? 'd' : 'f', perm, filename); } if (extract_) { char path[PATH_MAX]; int fd; concat_path(path, PATH_MAX, output_root_, filename); // Directories created must have executable bit set and be owner writeable. // Otherwise, we cannot write or create any file inside. mkdirs(path, perm | S_IWUSR | S_IXUSR); if (!isdir) { fd = open(path, O_CREAT | O_WRONLY, perm); if (fd < 0) { fprintf(stderr, "Cannot open file %s for writing: %s\n", path, strerror(errno)); abort(); } SYSCALL(write(fd, data, size)); SYSCALL(close(fd)); } } } // Get the basename of path and store it in output. output_size // is the size of the output buffer. void basename(const char *path, char *output, size_t output_size) { const char *pointer = strrchr(path, '/'); if (pointer == NULL) { pointer = path; } else { pointer++; // Skip the leading slash. } strncpy(output, pointer, output_size); output[output_size-1] = 0; } // copy size bytes from file descriptor fd into buffer. int copy_file_to_buffer(int fd, size_t size, void *buffer) { size_t nb_read = 0; while (nb_read < size) { size_t to_read = size - nb_read; if (to_read > 16384 /* 16K */) { to_read = 16384; } ssize_t r = read(fd, static_cast(buffer) + nb_read, to_read); if (r < 0) { return -1; } nb_read += r; } return 0; } // Execute the extraction (or just listing if just v is provided) int extract(char *zipfile, char* exdir, char **files, bool verbose, bool extract) { char cwd[PATH_MAX]; if (getcwd(cwd, PATH_MAX) == NULL) { fprintf(stderr, "getcwd() failed: %s.\n", strerror(errno)); return -1; } char output_root[PATH_MAX]; if (exdir != NULL) { concat_path(output_root, PATH_MAX, cwd, exdir); } else { strncpy(output_root, cwd, PATH_MAX); } UnzipProcessor processor(output_root, files, verbose, extract); std::unique_ptr extractor(ZipExtractor::Create(zipfile, &processor)); if (extractor.get() == NULL) { fprintf(stderr, "Unable to open zip file %s: %s.\n", zipfile, strerror(errno)); return -1; } if (extractor->ProcessAll() < 0) { fprintf(stderr, "%s.\n", extractor->GetError()); return -1; } return 0; } // add a file to the zip int add_file(std::unique_ptr const &builder, char *file, char *zip_path, bool flatten, bool verbose, bool compress) { struct stat statst; statst.st_size = 0; statst.st_mode = 0666; if (file != NULL) { if (stat(file, &statst) < 0) { fprintf(stderr, "Cannot stat file %s: %s.\n", file, strerror(errno)); return -1; } } char *final_path = zip_path != NULL ? zip_path : file; bool isdir = (statst.st_mode & S_IFDIR) != 0; if (flatten && isdir) { return 0; } // Compute the path, flattening it if requested char path[PATH_MAX]; size_t len = strlen(final_path); if (len > PATH_MAX) { fprintf(stderr, "Path too long: %s.\n", final_path); return -1; } if (flatten) { basename(final_path, path, PATH_MAX); } else { strncpy(path, final_path, PATH_MAX); path[PATH_MAX - 1] = 0; if (isdir && len < PATH_MAX - 1) { // Add the trailing slash for folders path[len] = '/'; path[len + 1] = 0; } } if (verbose) { mode_t perm = statst.st_mode & 0777; printf("%c %o %s\n", isdir ? 'd' : 'f', perm, path); } u1 *buffer = builder->NewFile(path, mode_to_zipattr(statst.st_mode)); if (isdir || statst.st_size == 0) { builder->FinishFile(0); } else { // read the input file int fd = open(file, O_RDONLY); if (fd < 0) { fprintf(stderr, "Can't open file %s for reading: %s.\n", file, strerror(errno)); return -1; } if (copy_file_to_buffer(fd, statst.st_size, buffer) < 0) { fprintf(stderr, "Can't read file %s: %s.\n", file, strerror(errno)); close(fd); return -1; } close(fd); builder->FinishFile(statst.st_size, compress, true); } return 0; } // Read a list of files separated by newlines. The resulting array can be // freed using the free method. char **read_filelist(char *filename) { struct stat statst; int fd = open(filename, O_RDONLY); if (fd < 0) { fprintf(stderr, "Can't open file %s for reading: %s.\n", filename, strerror(errno)); return NULL; } if (fstat(fd, &statst) < 0) { fprintf(stderr, "Cannot stat file %s: %s.\n", filename, strerror(errno)); return NULL; } char *data = static_cast(malloc(statst.st_size)); if (copy_file_to_buffer(fd, statst.st_size, data) < 0) { fprintf(stderr, "Can't read file %s: %s.\n", filename, strerror(errno)); close(fd); return NULL; } close(fd); int nb_entries = 1; for (int i = 0; i < statst.st_size; i++) { if (data[i] == '\n') { nb_entries++; } } size_t sizeof_array = sizeof(char *) * (nb_entries + 1); void *result = malloc(sizeof_array + statst.st_size); // copy the content char **filelist = static_cast(result); char *content = static_cast(result) + sizeof_array; memcpy(content, data, statst.st_size); free(data); // Create the corresponding array int j = 1; filelist[0] = content; for (int i = 0; i < statst.st_size; i++) { if (content[i] == '\n') { content[i] = 0; if (i + 1 < statst.st_size) { filelist[j] = content + i + 1; j++; } } } filelist[j] = NULL; return filelist; } // return real paths of the files char **parse_filelist(char *zipfile, char **file_entries, int nb_entries, bool flatten) { // no need to free since the path lists should live until the end of the // program char **files = static_cast(malloc(sizeof(char *) * nb_entries)); char **zip_paths = file_entries; for (int i = 0; i < nb_entries; i++) { char *p_eq = strchr(file_entries[i], '='); if (p_eq != NULL) { if (flatten) { fprintf(stderr, "Unable to create zip file %s: %s.\n", zipfile, "= can't be used with flatten"); free(files); return NULL; } if (p_eq == file_entries[i]) { fprintf(stderr, "Unable to create zip file %s: %s.\n", zipfile, "A zip path should be given before ="); free(files); return NULL; } *p_eq = '\0'; files[i] = p_eq + 1; if (files[i][0] == '\0') { files[i] = NULL; } } else { files[i] = file_entries[i]; zip_paths[i] = NULL; } } return files; } // Execute the create operation int create(char *zipfile, char **file_entries, bool flatten, bool verbose, bool compress) { int nb_entries = 0; while (file_entries[nb_entries] != NULL) { nb_entries++; } char **zip_paths = file_entries; char **files = parse_filelist(zipfile, file_entries, nb_entries, flatten); if (files == NULL) { return -1; } u8 size = ZipBuilder::EstimateSize(files, zip_paths, nb_entries); if (size == 0) { return -1; } std::unique_ptr builder(ZipBuilder::Create(zipfile, size)); if (builder.get() == NULL) { fprintf(stderr, "Unable to create zip file %s: %s.\n", zipfile, strerror(errno)); return -1; } for (int i = 0; i < nb_entries; i++) { if (add_file(builder, files[i], zip_paths[i], flatten, verbose, compress) < 0) { return -1; } } if (builder->Finish() < 0) { fprintf(stderr, "%s\n", builder->GetError()); return -1; } return 0; } } // namespace devtools_ijar // // main method // static void usage(char *progname) { fprintf(stderr, "Usage: %s [vxc[fC]] x.zip [-d exdir] [[zip_path1=]file1 ... " "[zip_pathn=]filen]\n", progname); fprintf(stderr, " v verbose - list all file in x.zip\n"); fprintf(stderr, " x extract - extract files in x.zip to current directory, or " " an optional directory relative to the current directory " " specified through -d option\n"); fprintf(stderr, " c create - add files to x.zip\n"); fprintf(stderr, " f flatten - flatten files to use with create operation\n"); fprintf(stderr, " C compress - compress files when using the create operation\n"); fprintf(stderr, "x and c cannot be used in the same command-line.\n"); fprintf(stderr, "\nFor every file, a path in the zip can be specified. Examples:\n"); fprintf(stderr, " zipper c x.zip a/b/__init__.py= # Add an empty file at " "a/b/__init__.py\n"); fprintf(stderr, " zipper c x.zip a/b/main.py=foo/bar/bin.py # Add file " "foo/bar/bin.py at a/b/main.py\n"); fprintf(stderr, "\nIf the zip path is not specified, it is assumed to be the file " "path.\n"); exit(1); } int main(int argc, char **argv) { bool extract = false; bool verbose = false; bool create = false; bool compress = false; bool flatten = false; if (argc < 3) { usage(argv[0]); } for (int i = 0; argv[1][i] != 0; i++) { switch (argv[1][i]) { case 'x': extract = true; break; case 'v': verbose = true; break; case 'c': create = true; break; case 'f': flatten = true; break; case 'C': compress = true; break; default: usage(argv[0]); } } // x and c cannot be used in the same command-line. if (create && extract) { usage(argv[0]); } // Calculate the argument index of the first entry file. int filelist_start_index; if (argc > 3 && strcmp(argv[3], "-d") == 0) { filelist_start_index = 5; } else { filelist_start_index = 3; } char** filelist = NULL; // We have one option file. Read and extract the content. if (argc == filelist_start_index + 1 && argv[filelist_start_index][0] == '@') { char* filelist_name = argv[filelist_start_index]; filelist = devtools_ijar::read_filelist(filelist_name + 1); if (filelist == NULL) { fprintf(stderr, "Can't read file list %s: %s.\n", filelist_name, strerror(errno)); return -1; } // We have more than one files. Assume that they are all file entries. } else if (argc >= filelist_start_index + 1) { filelist = argv + filelist_start_index; } else { // There are no entry files specified. This is forbidden if we are creating // a zip file. if (create) { fprintf(stderr, "Can't create zip without input files specified."); return -1; } } if (create) { // Create a zip return devtools_ijar::create(argv[2], filelist, flatten, verbose, compress); } else { if (flatten) { usage(argv[0]); } char* exdir = NULL; if (argc > 3 && strcmp(argv[3], "-d") == 0) { exdir = argv[4]; } // Extraction / list mode return devtools_ijar::extract(argv[2], exdir, filelist, verbose, extract); } }