# pylint: disable=g-bad-file-header
# Copyright 2017 The Bazel Authors. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Utils to copy the contents of a tar or zip file into another zip file."""

import contextlib
import os.path
import stat
import tarfile
import zipfile

# Every copied entry is stamped with this constant date so that the output
# archive does not depend on the timestamps stored in the input archive.
_FIXED_DATE_TIME = (1980, 1, 1, 0, 0, 0)

# 0120000 originally comes from the definition of S_IFLNK and marks a symbolic
# link in the Zip file format. The Unix mode lives in the upper 16 bits of
# `external_attr`.
_SYMLINK_ATTR = 0o120000 << 16


def is_mode_executable(mode):
  """Returns true if `mode` has any of the executable bits set."""
  return mode & (stat.S_IXUSR | stat.S_IXGRP | stat.S_IXOTH) > 0


def is_executable(path):
  """Returns true if `path` is an executable file/directory."""
  return is_mode_executable(os.stat(path)[stat.ST_MODE])


def _file_attr(mode):
  """Returns the zip `external_attr` for a regular file with Unix `mode`.

  Permissions are normalized: 0755 if any executable bit is set in `mode`,
  0644 otherwise.
  """
  return (0o755 if is_mode_executable(mode) else 0o644) << 16


def copy_tar_to_zip(output_zip, input_file, process_filename=None):
  """Copy a tar file's contents into a zip file.

  This function unpacks every file from `input_file` and puts them into
  `output_zip`. The unpacking is performed in-memory.

  Regular files are stored deflated with normalized permissions (0755 or
  0644); symbolic links are stored as zip symlink entries whose content is the
  link target. Directories, hard links and special files are skipped.

  Args:
    output_zip: zipfile.ZipFile; the destination archive
    input_file: string; path to the source tar file
    process_filename: function(str) -> str; optional; for a packed file entry
      in `input_file` it computes the path in `output_zip`. It is called for
      every entry of the tar file, including the ones that end up skipped.
  """
  with tarfile.open(input_file, 'r', errorlevel=2) as tar_file:
    for tar_entry in tar_file:
      filename = (process_filename(tar_entry.name)
                  if process_filename else tar_entry.name)
      zipinfo = zipfile.ZipInfo(filename, _FIXED_DATE_TIME)
      if tar_entry.isreg():
        zipinfo.external_attr = _file_attr(tar_entry.mode)
        zipinfo.compress_type = zipfile.ZIP_DEFLATED
        # Close the member's file object as soon as its bytes are read.
        with contextlib.closing(tar_file.extractfile(tar_entry)) as content:
          output_zip.writestr(zipinfo, content.read())
      elif tar_entry.issym():
        zipinfo.external_attr = _SYMLINK_ATTR
        output_zip.writestr(zipinfo, tar_entry.linkname)
      # Anything else (directories, hard links, special files, ...) is
      # deliberately ignored.


def copy_zip_to_zip(output_zip, input_file, process_filename=None):
  """Copy a zip file's contents into another zip file.

  This function unpacks every file from `input_file` and puts them into
  `output_zip`. The unpacking is performed in-memory.

  Each entry keeps its compression type. Symbolic link entries stay symbolic
  links, matching `copy_tar_to_zip`; every other entry gets normalized
  permissions (0755 if it had any executable bit set, 0644 otherwise).

  Args:
    output_zip: zipfile.ZipFile; the destination archive
    input_file: string; path to the source zip file
    process_filename: function(str) -> str; optional; for a packed file entry
      in `input_file` it computes the path in `output_zip`
  """
  # Adding contextlib.closing to be python 2.6 (for centos 6.7) compatible
  with contextlib.closing(zipfile.ZipFile(input_file, 'r')) as zip_file:
    for zip_entry in zip_file.infolist():
      filename = (process_filename(zip_entry.filename)
                  if process_filename else zip_entry.filename)
      zipinfo = zipfile.ZipInfo(filename, _FIXED_DATE_TIME)
      # The Unix mode of the source entry is kept in the upper 16 bits.
      mode = zip_entry.external_attr >> 16 & 0xFFFF
      if stat.S_ISLNK(mode):
        # Without this check a symlink would be rewritten as a regular file
        # whose content is the link target.
        zipinfo.external_attr = _SYMLINK_ATTR
      else:
        zipinfo.external_attr = _file_attr(mode)
      zipinfo.compress_type = zip_entry.compress_type
      output_zip.writestr(zipinfo, zip_file.read(zip_entry))