shuit模块

#高级的 文件、文件夹、压缩包 处理模块

shutil.copyfileobj(fsrc, fdst[, length])
将文件内容拷贝到另一个文件中,可以部分内容

def copyfile(src, dst):
"""Copy data from src to dst"""
if _samefile(src, dst):
raise Error("`%s` and `%s` are the same file" % (src, dst)) for fn in [src, dst]:
try:
st = os.stat(fn)
except OSError:
# File most likely does not exist
pass
else:
# XXX What about other special files? (sockets, devices...)
if stat.S_ISFIFO(st.st_mode):
raise SpecialFileError("`%s` is a named pipe" % fn) with open(src, 'rb') as fsrc:
with open(dst, 'wb') as fdst:
copyfileobj(fsrc, fdst)
 
shutil.move('/build/executables', 'installdir')      # 移动文件或目录 
 
shutil.copymode(src, dst)
仅拷贝权限。内容、组、用户均不变
def copymode(src, dst):
"""Copy mode bits from src to dst"""
if hasattr(os, 'chmod'):
st = os.stat(src)
mode = stat.S_IMODE(st.st_mode)
os.chmod(dst, mode)

shutil.copystat(src, dst)
拷贝状态的信息,包括:mode bits, atime, mtime, flags

def copystat(src, dst):
"""Copy all stat info (mode bits, atime, mtime, flags) from src to dst"""
st = os.stat(src)
mode = stat.S_IMODE(st.st_mode)
if hasattr(os, 'utime'):
os.utime(dst, (st.st_atime, st.st_mtime))
if hasattr(os, 'chmod'):
os.chmod(dst, mode)
if hasattr(os, 'chflags') and hasattr(st, 'st_flags'):
try:
os.chflags(dst, st.st_flags)
except OSError, why:
for err in 'EOPNOTSUPP', 'ENOTSUP':
if hasattr(errno, err) and why.errno == getattr(errno, err):
break
else:
raise

shutil.copy(src, dst)
拷贝文件和权限

def copy(src, dst):
"""Copy data and mode bits ("cp src dst"). The destination may be a directory. """
if os.path.isdir(dst):
dst = os.path.join(dst, os.path.basename(src))
copyfile(src, dst)
copymode(src, dst)

shutil.copy2(src, dst)
拷贝文件和状态信息

def copy2(src, dst):
"""Copy data and all stat info ("cp -p src dst"). The destination may be a directory. """
if os.path.isdir(dst):
dst = os.path.join(dst, os.path.basename(src))
copyfile(src, dst)
copystat(src, dst)

shutil.ignore_patterns(*patterns)
shutil.copytree(src, dst, symlinks=False, ignore=None)
递归的去拷贝文件

例如:copytree(source, destination, ignore=ignore_patterns('*.pyc', 'tmp*'))

def ignore_patterns(*patterns):
"""Function that can be used as copytree() ignore parameter. Patterns is a sequence of glob-style patterns
that are used to exclude files"""
def _ignore_patterns(path, names):
ignored_names = []
for pattern in patterns:
ignored_names.extend(fnmatch.filter(names, pattern))
return set(ignored_names)
return _ignore_patterns def copytree(src, dst, symlinks=False, ignore=None):
"""Recursively copy a directory tree using copy2(). The destination directory must not already exist.
If exception(s) occur, an Error is raised with a list of reasons. If the optional symlinks flag is true, symbolic links in the
source tree result in symbolic links in the destination tree; if
it is false, the contents of the files pointed to by symbolic
links are copied. The optional ignore argument is a callable. If given, it
is called with the `src` parameter, which is the directory
being visited by copytree(), and `names` which is the list of
`src` contents, as returned by os.listdir(): callable(src, names) -> ignored_names Since copytree() is called recursively, the callable will be
called once for each directory that is copied. It returns a
list of names relative to the `src` directory that should
not be copied. XXX Consider this example code rather than the ultimate tool. """
names = os.listdir(src)
if ignore is not None:
ignored_names = ignore(src, names)
else:
ignored_names = set() os.makedirs(dst)
errors = []
for name in names:
if name in ignored_names:
continue
srcname = os.path.join(src, name)
dstname = os.path.join(dst, name)
try:
if symlinks and os.path.islink(srcname):
linkto = os.readlink(srcname)
os.symlink(linkto, dstname)
elif os.path.isdir(srcname):
copytree(srcname, dstname, symlinks, ignore)
else:
# Will raise a SpecialFileError for unsupported file types
copy2(srcname, dstname)
# catch the Error from the recursive copytree so that we can
# continue with other files
except Error, err:
errors.extend(err.args[0])
except EnvironmentError, why:
errors.append((srcname, dstname, str(why)))
try:
copystat(src, dst)
except OSError, why:
if WindowsError is not None and isinstance(why, WindowsError):
# Copying file access times may fail on Windows
pass
else:
errors.append((src, dst, str(why)))
if errors:
raise Error, errors

shutil.rmtree(path[, ignore_errors[, onerror]])
递归的去删除文件

def rmtree(path, ignore_errors=False, onerror=None):
"""Recursively delete a directory tree. If ignore_errors is set, errors are ignored; otherwise, if onerror
is set, it is called to handle the error with arguments (func,
path, exc_info) where func is os.listdir, os.remove, or os.rmdir;
path is the argument to that function that caused it to fail; and
exc_info is a tuple returned by sys.exc_info(). If ignore_errors
is false and onerror is None, an exception is raised. """
if ignore_errors:
def onerror(*args):
pass
elif onerror is None:
def onerror(*args):
raise
try:
if os.path.islink(path):
# symlinks to directories are forbidden, see bug #1669
raise OSError("Cannot call rmtree on a symbolic link")
except OSError:
onerror(os.path.islink, path, sys.exc_info())
# can't continue even if onerror hook returns
return
names = []
try:
names = os.listdir(path)
except os.error, err:
onerror(os.listdir, path, sys.exc_info())
for name in names:
fullname = os.path.join(path, name)
try:
mode = os.lstat(fullname).st_mode
except os.error:
mode = 0
if stat.S_ISDIR(mode):
rmtree(fullname, ignore_errors, onerror)
else:
try:
os.remove(fullname)
except os.error, err:
onerror(os.remove, fullname, sys.exc_info())
try:
os.rmdir(path)
except os.error:
onerror(os.rmdir, path, sys.exc_info())

shutil.move(src, dst)
递归的去移动文件

def move(src, dst):
"""Recursively move a file or directory to another location. This is
similar to the Unix "mv" command. If the destination is a directory or a symlink to a directory, the source
is moved inside the directory. The destination path must not already
exist. If the destination already exists but is not a directory, it may be
overwritten depending on os.rename() semantics. If the destination is on our current filesystem, then rename() is used.
Otherwise, src is copied to the destination and then removed.
A lot more could be done here... A look at a mv.c shows a lot of
the issues this implementation glosses over. """
real_dst = dst
if os.path.isdir(dst):
if _samefile(src, dst):
# We might be on a case insensitive filesystem,
# perform the rename anyway.
os.rename(src, dst)
return real_dst = os.path.join(dst, _basename(src))
if os.path.exists(real_dst):
raise Error, "Destination path '%s' already exists" % real_dst
try:
os.rename(src, real_dst)
except OSError:
if os.path.isdir(src):
if _destinsrc(src, dst):
raise Error, "Cannot move a directory '%s' into itself '%s'." % (src, dst)
copytree(src, real_dst, symlinks=True)
rmtree(src)
else:
copy2(src, real_dst)
os.unlink(src)

shutil.make_archive(base_name, format,...)

创建压缩包并返回文件路径,例如:zip、tar

    • base_name: 压缩包的文件名,也可以是压缩包的路径。只是文件名时,则保存至当前目录,否则保存至指定路径,
      如:www                        =>保存至当前路径
      如:/Users/wupeiqi/www =>保存至/Users/wupeiqi/
    • format: 压缩包种类,“zip”, “tar”, “bztar”,“gztar”
    • root_dir: 要压缩的文件夹路径(默认当前目录)
    • owner: 用户,默认当前用户
    • group: 组,默认当前组
    • logger: 用于记录日志,通常是logging.Logger对象
    • #将 /Users/wupeiqi/Downloads/test 下的文件打包放置当前程序目录
      
      import shutil
      ret = shutil.make_archive("wwwwwwwwww", 'gztar', root_dir='/Users/wupeiqi/Downloads/test') #将 /Users/wupeiqi/Downloads/test 下的文件打包放置 /Users/wupeiqi/目录
      import shutil
      ret = shutil.make_archive("/Users/wupeiqi/wwwwwwwwww", 'gztar', root_dir='/Users/wupeiqi/Downloads/test')
      def make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,
      dry_run=0, owner=None, group=None, logger=None):
      """Create an archive file (eg. zip or tar). 'base_name' is the name of the file to create, minus any format-specific
      extension; 'format' is the archive format: one of "zip", "tar", "bztar"
      or "gztar". 'root_dir' is a directory that will be the root directory of the
      archive; ie. we typically chdir into 'root_dir' before creating the
      archive. 'base_dir' is the directory where we start archiving from;
      ie. 'base_dir' will be the common prefix of all files and
      directories in the archive. 'root_dir' and 'base_dir' both default
      to the current directory. Returns the name of the archive file. 'owner' and 'group' are used when creating a tar archive. By default,
      uses the current owner and group.
      """
      save_cwd = os.getcwd()
      if root_dir is not None:
      if logger is not None:
      logger.debug("changing into '%s'", root_dir)
      base_name = os.path.abspath(base_name)
      if not dry_run:
      os.chdir(root_dir) if base_dir is None:
      base_dir = os.curdir kwargs = {'dry_run': dry_run, 'logger': logger} try:
      format_info = _ARCHIVE_FORMATS[format]
      except KeyError:
      raise ValueError, "unknown archive format '%s'" % format func = format_info[0]
      for arg, val in format_info[1]:
      kwargs[arg] = val if format != 'zip':
      kwargs['owner'] = owner
      kwargs['group'] = group try:
      filename = func(base_name, base_dir, **kwargs)
      finally:
      if root_dir is not None:
      if logger is not None:
      logger.debug("changing back to '%s'", save_cwd)
      os.chdir(save_cwd) rCtrleturn filename

      shutil 对压缩包的处理是调用 ZipFile 和 TarFile 两个模块来进行的,详细

    • import zipfile
      
      # 压缩
      z = zipfile.ZipFile('laxi.zip', 'w')
      z.write('a.log')
      z.write('data.data')
      z.close() # 解压
      z = zipfile.ZipFile('laxi.zip', 'r')
      z.extractall()
      z.close() zipfile 压缩解压

      zipfile 压缩解压

      import tarfile
      
      # 压缩
      tar = tarfile.open('your.tar','w')
      tar.add('/Users/wupeiqi/PycharmProjects/bbs2.zip', arcname='bbs2.zip')
      tar.add('/Users/wupeiqi/PycharmProjects/cmdb.zip', arcname='cmdb.zip')
      tar.close() # 解压
      tar = tarfile.open('your.tar','r')
      tar.extractall() # 可设置解压地址
      tar.close() tarfile 压缩解压

      tarfile 压缩解压

      class ZipFile(object):
      """ Class with methods to open, read, write, close, list zip files. z = ZipFile(file, mode="r", compression=ZIP_STORED, allowZip64=False) file: Either the path to the file, or a file-like object.
      If it is a path, the file will be opened and closed by ZipFile.
      mode: The mode can be either read "r", write "w" or append "a".
      compression: ZIP_STORED (no compression) or ZIP_DEFLATED (requires zlib).
      allowZip64: if True ZipFile will create files with ZIP64 extensions when
      needed, otherwise it will raise an exception when this would
      be necessary. """ fp = None # Set here since __del__ checks it def __init__(self, file, mode="r", compression=ZIP_STORED, allowZip64=False):
      """Open the ZIP file with mode read "r", write "w" or append "a"."""
      if mode not in ("r", "w", "a"):
      raise RuntimeError('ZipFile() requires mode "r", "w", or "a"') if compression == ZIP_STORED:
      pass
      elif compression == ZIP_DEFLATED:
      if not zlib:
      raise RuntimeError,\
      "Compression requires the (missing) zlib module"
      else:
      raise RuntimeError, "That compression method is not supported" self._allowZip64 = allowZip64
      self._didModify = False
      self.debug = 0 # Level of printing: 0 through 3
      self.NameToInfo = {} # Find file info given name
      self.filelist = [] # List of ZipInfo instances for archive
      self.compression = compression # Method of compression
      self.mode = key = mode.replace('b', '')[0]
      self.pwd = None
      self._comment = '' # Check if we were passed a file-like object
      if isinstance(file, basestring):
      self._filePassed = 0
      self.filename = file
      modeDict = {'r' : 'rb', 'w': 'wb', 'a' : 'r+b'}
      try:
      self.fp = open(file, modeDict[mode])
      except IOError:
      if mode == 'a':
      mode = key = 'w'
      self.fp = open(file, modeDict[mode])
      else:
      raise
      else:
      self._filePassed = 1
      self.fp = file
      self.filename = getattr(file, 'name', None) try:
      if key == 'r':
      self._RealGetContents()
      elif key == 'w':
      # set the modified flag so central directory gets written
      # even if no files are added to the archive
      self._didModify = True
      elif key == 'a':
      try:
      # See if file is a zip file
      self._RealGetContents()
      # seek to start of directory and overwrite
      self.fp.seek(self.start_dir, 0)
      except BadZipfile:
      # file is not a zip file, just append
      self.fp.seek(0, 2) # set the modified flag so central directory gets written
      # even if no files are added to the archive
      self._didModify = True
      else:
      raise RuntimeError('Mode must be "r", "w" or "a"')
      except:
      fp = self.fp
      self.fp = None
      if not self._filePassed:
      fp.close()
      raise def __enter__(self):
      return self def __exit__(self, type, value, traceback):
      self.close() def _RealGetContents(self):
      """Read in the table of contents for the ZIP file."""
      fp = self.fp
      try:
      endrec = _EndRecData(fp)
      except IOError:
      raise BadZipfile("File is not a zip file")
      if not endrec:
      raise BadZipfile, "File is not a zip file"
      if self.debug > 1:
      print endrec
      size_cd = endrec[_ECD_SIZE] # bytes in central directory
      offset_cd = endrec[_ECD_OFFSET] # offset of central directory
      self._comment = endrec[_ECD_COMMENT] # archive comment # "concat" is zero, unless zip was concatenated to another file
      concat = endrec[_ECD_LOCATION] - size_cd - offset_cd
      if endrec[_ECD_SIGNATURE] == stringEndArchive64:
      # If Zip64 extension structures are present, account for them
      concat -= (sizeEndCentDir64 + sizeEndCentDir64Locator) if self.debug > 2:
      inferred = concat + offset_cd
      print "given, inferred, offset", offset_cd, inferred, concat
      # self.start_dir: Position of start of central directory
      self.start_dir = offset_cd + concat
      fp.seek(self.start_dir, 0)
      data = fp.read(size_cd)
      fp = cStringIO.StringIO(data)
      total = 0
      while total < size_cd:
      centdir = fp.read(sizeCentralDir)
      if len(centdir) != sizeCentralDir:
      raise BadZipfile("Truncated central directory")
      centdir = struct.unpack(structCentralDir, centdir)
      if centdir[_CD_SIGNATURE] != stringCentralDir:
      raise BadZipfile("Bad magic number for central directory")
      if self.debug > 2:
      print centdir
      filename = fp.read(centdir[_CD_FILENAME_LENGTH])
      # Create ZipInfo instance to store file information
      x = ZipInfo(filename)
      x.extra = fp.read(centdir[_CD_EXTRA_FIELD_LENGTH])
      x.comment = fp.read(centdir[_CD_COMMENT_LENGTH])
      x.header_offset = centdir[_CD_LOCAL_HEADER_OFFSET]
      (x.create_version, x.create_system, x.extract_version, x.reserved,
      x.flag_bits, x.compress_type, t, d,
      x.CRC, x.compress_size, x.file_size) = centdir[1:12]
      x.volume, x.internal_attr, x.external_attr = centdir[15:18]
      # Convert date/time code to (year, month, day, hour, min, sec)
      x._raw_time = t
      x.date_time = ( (d>>9)+1980, (d>>5)&0xF, d&0x1F,
      t>>11, (t>>5)&0x3F, (t&0x1F) * 2 ) x._decodeExtra()
      x.header_offset = x.header_offset + concat
      x.filename = x._decodeFilename()
      self.filelist.append(x)
      self.NameToInfo[x.filename] = x # update total bytes read from central directory
      total = (total + sizeCentralDir + centdir[_CD_FILENAME_LENGTH]
      + centdir[_CD_EXTRA_FIELD_LENGTH]
      + centdir[_CD_COMMENT_LENGTH]) if self.debug > 2:
      print "total", total def namelist(self):
      """Return a list of file names in the archive."""
      l = []
      for data in self.filelist:
      l.append(data.filename)
      return l def infolist(self):
      """Return a list of class ZipInfo instances for files in the
      archive."""
      return self.filelist def printdir(self):
      """Print a table of contents for the zip file."""
      print "%-46s %19s %12s" % ("File Name", "Modified ", "Size")
      for zinfo in self.filelist:
      date = "%d-%02d-%02d %02d:%02d:%02d" % zinfo.date_time[:6]
      print "%-46s %s %12d" % (zinfo.filename, date, zinfo.file_size) def testzip(self):
      """Read all the files and check the CRC."""
      chunk_size = 2 ** 20
      for zinfo in self.filelist:
      try:
      # Read by chunks, to avoid an OverflowError or a
      # MemoryError with very large embedded files.
      with self.open(zinfo.filename, "r") as f:
      while f.read(chunk_size): # Check CRC-32
      pass
      except BadZipfile:
      return zinfo.filename def getinfo(self, name):
      """Return the instance of ZipInfo given 'name'."""
      info = self.NameToInfo.get(name)
      if info is None:
      raise KeyError(
      'There is no item named %r in the archive' % name) return info def setpassword(self, pwd):
      """Set default password for encrypted files."""
      self.pwd = pwd @property
      def comment(self):
      """The comment text associated with the ZIP file."""
      return self._comment @comment.setter
      def comment(self, comment):
      # check for valid comment length
      if len(comment) > ZIP_MAX_COMMENT:
      import warnings
      warnings.warn('Archive comment is too long; truncating to %d bytes'
      % ZIP_MAX_COMMENT, stacklevel=2)
      comment = comment[:ZIP_MAX_COMMENT]
      self._comment = comment
      self._didModify = True def read(self, name, pwd=None):
      """Return file bytes (as a string) for name."""
      return self.open(name, "r", pwd).read() def open(self, name, mode="r", pwd=None):
      """Return file-like object for 'name'."""
      if mode not in ("r", "U", "rU"):
      raise RuntimeError, 'open() requires mode "r", "U", or "rU"'
      if not self.fp:
      raise RuntimeError, \
      "Attempt to read ZIP archive that was already closed" # Only open a new file for instances where we were not
      # given a file object in the constructor
      if self._filePassed:
      zef_file = self.fp
      should_close = False
      else:
      zef_file = open(self.filename, 'rb')
      should_close = True try:
      # Make sure we have an info object
      if isinstance(name, ZipInfo):
      # 'name' is already an info object
      zinfo = name
      else:
      # Get info object for name
      zinfo = self.getinfo(name) zef_file.seek(zinfo.header_offset, 0) # Skip the file header:
      fheader = zef_file.read(sizeFileHeader)
      if len(fheader) != sizeFileHeader:
      raise BadZipfile("Truncated file header")
      fheader = struct.unpack(structFileHeader, fheader)
      if fheader[_FH_SIGNATURE] != stringFileHeader:
      raise BadZipfile("Bad magic number for file header") fname = zef_file.read(fheader[_FH_FILENAME_LENGTH])
      if fheader[_FH_EXTRA_FIELD_LENGTH]:
      zef_file.read(fheader[_FH_EXTRA_FIELD_LENGTH]) if fname != zinfo.orig_filename:
      raise BadZipfile, \
      'File name in directory "%s" and header "%s" differ.' % (
      zinfo.orig_filename, fname) # check for encrypted flag & handle password
      is_encrypted = zinfo.flag_bits & 0x1
      zd = None
      if is_encrypted:
      if not pwd:
      pwd = self.pwd
      if not pwd:
      raise RuntimeError, "File %s is encrypted, " \
      "password required for extraction" % name zd = _ZipDecrypter(pwd)
      # The first 12 bytes in the cypher stream is an encryption header
      # used to strengthen the algorithm. The first 11 bytes are
      # completely random, while the 12th contains the MSB of the CRC,
      # or the MSB of the file time depending on the header type
      # and is used to check the correctness of the password.
      bytes = zef_file.read(12)
      h = map(zd, bytes[0:12])
      if zinfo.flag_bits & 0x8:
      # compare against the file type from extended local headers
      check_byte = (zinfo._raw_time >> 8) & 0xff
      else:
      # compare against the CRC otherwise
      check_byte = (zinfo.CRC >> 24) & 0xff
      if ord(h[11]) != check_byte:
      raise RuntimeError("Bad password for file", name) return ZipExtFile(zef_file, mode, zinfo, zd,
      close_fileobj=should_close)
      except:
      if should_close:
      zef_file.close()
      raise def extract(self, member, path=None, pwd=None):
      """Extract a member from the archive to the current working directory,
      using its full name. Its file information is extracted as accurately
      as possible. `member' may be a filename or a ZipInfo object. You can
      specify a different directory using `path'.
      """
      if not isinstance(member, ZipInfo):
      member = self.getinfo(member) if path is None:
      path = os.getcwd() return self._extract_member(member, path, pwd) def extractall(self, path=None, members=None, pwd=None):
      """Extract all members from the archive to the current working
      directory. `path' specifies a different directory to extract to.
      `members' is optional and must be a subset of the list returned
      by namelist().
      """
      if members is None:
      members = self.namelist() for zipinfo in members:
      self.extract(zipinfo, path, pwd) def _extract_member(self, member, targetpath, pwd):
      """Extract the ZipInfo object 'member' to a physical
      file on the path targetpath.
      """
      # build the destination pathname, replacing
      # forward slashes to platform specific separators.
      arcname = member.filename.replace('/', os.path.sep) if os.path.altsep:
      arcname = arcname.replace(os.path.altsep, os.path.sep)
      # interpret absolute pathname as relative, remove drive letter or
      # UNC path, redundant separators, "." and ".." components.
      arcname = os.path.splitdrive(arcname)[1]
      arcname = os.path.sep.join(x for x in arcname.split(os.path.sep)
      if x not in ('', os.path.curdir, os.path.pardir))
      if os.path.sep == '\\':
      # filter illegal characters on Windows
      illegal = ':<>|"?*'
      if isinstance(arcname, unicode):
      table = {ord(c): ord('_') for c in illegal}
      else:
      table = string.maketrans(illegal, '_' * len(illegal))
      arcname = arcname.translate(table)
      # remove trailing dots
      arcname = (x.rstrip('.') for x in arcname.split(os.path.sep))
      arcname = os.path.sep.join(x for x in arcname if x) targetpath = os.path.join(targetpath, arcname)
      targetpath = os.path.normpath(targetpath) # Create all upper directories if necessary.
      upperdirs = os.path.dirname(targetpath)
      if upperdirs and not os.path.exists(upperdirs):
      os.makedirs(upperdirs) if member.filename[-1] == '/':
      if not os.path.isdir(targetpath):
      os.mkdir(targetpath)
      return targetpath with self.open(member, pwd=pwd) as source, \
      file(targetpath, "wb") as target:
      shutil.copyfileobj(source, target) return targetpath def _writecheck(self, zinfo):
      """Check for errors before writing a file to the archive."""
      if zinfo.filename in self.NameToInfo:
      import warnings
      warnings.warn('Duplicate name: %r' % zinfo.filename, stacklevel=3)
      if self.mode not in ("w", "a"):
      raise RuntimeError, 'write() requires mode "w" or "a"'
      if not self.fp:
      raise RuntimeError, \
      "Attempt to write ZIP archive that was already closed"
      if zinfo.compress_type == ZIP_DEFLATED and not zlib:
      raise RuntimeError, \
      "Compression requires the (missing) zlib module"
      if zinfo.compress_type not in (ZIP_STORED, ZIP_DEFLATED):
      raise RuntimeError, \
      "That compression method is not supported"
      if not self._allowZip64:
      requires_zip64 = None
      if len(self.filelist) >= ZIP_FILECOUNT_LIMIT:
      requires_zip64 = "Files count"
      elif zinfo.file_size > ZIP64_LIMIT:
      requires_zip64 = "Filesize"
      elif zinfo.header_offset > ZIP64_LIMIT:
      requires_zip64 = "Zipfile size"
      if requires_zip64:
      raise LargeZipFile(requires_zip64 +
      " would require ZIP64 extensions") def write(self, filename, arcname=None, compress_type=None):
      """Put the bytes from filename into the archive under the name
      arcname."""
      if not self.fp:
      raise RuntimeError(
      "Attempt to write to ZIP archive that was already closed") st = os.stat(filename)
      isdir = stat.S_ISDIR(st.st_mode)
      mtime = time.localtime(st.st_mtime)
      date_time = mtime[0:6]
      # Create ZipInfo instance to store file information
      if arcname is None:
      arcname = filename
      arcname = os.path.normpath(os.path.splitdrive(arcname)[1])
      while arcname[0] in (os.sep, os.altsep):
      arcname = arcname[1:]
      if isdir:
      arcname += '/'
      zinfo = ZipInfo(arcname, date_time)
      zinfo.external_attr = (st[0] & 0xFFFF) << 16L # Unix attributes
      if compress_type is None:
      zinfo.compress_type = self.compression
      else:
      zinfo.compress_type = compress_type zinfo.file_size = st.st_size
      zinfo.flag_bits = 0x00
      zinfo.header_offset = self.fp.tell() # Start of header bytes self._writecheck(zinfo)
      self._didModify = True if isdir:
      zinfo.file_size = 0
      zinfo.compress_size = 0
      zinfo.CRC = 0
      zinfo.external_attr |= 0x10 # MS-DOS directory flag
      self.filelist.append(zinfo)
      self.NameToInfo[zinfo.filename] = zinfo
      self.fp.write(zinfo.FileHeader(False))
      return with open(filename, "rb") as fp:
      # Must overwrite CRC and sizes with correct data later
      zinfo.CRC = CRC = 0
      zinfo.compress_size = compress_size = 0
      # Compressed size can be larger than uncompressed size
      zip64 = self._allowZip64 and \
      zinfo.file_size * 1.05 > ZIP64_LIMIT
      self.fp.write(zinfo.FileHeader(zip64))
      if zinfo.compress_type == ZIP_DEFLATED:
      cmpr = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION,
      zlib.DEFLATED, -15)
      else:
      cmpr = None
      file_size = 0
      while 1:
      buf = fp.read(1024 * 8)
      if not buf:
      break
      file_size = file_size + len(buf)
      CRC = crc32(buf, CRC) & 0xffffffff
      if cmpr:
      buf = cmpr.compress(buf)
      compress_size = compress_size + len(buf)
      self.fp.write(buf)
      if cmpr:
      buf = cmpr.flush()
      compress_size = compress_size + len(buf)
      self.fp.write(buf)
      zinfo.compress_size = compress_size
      else:
      zinfo.compress_size = file_size
      zinfo.CRC = CRC
      zinfo.file_size = file_size
      if not zip64 and self._allowZip64:
      if file_size > ZIP64_LIMIT:
      raise RuntimeError('File size has increased during compressing')
      if compress_size > ZIP64_LIMIT:
      raise RuntimeError('Compressed size larger than uncompressed size')
      # Seek backwards and write file header (which will now include
      # correct CRC and file sizes)
      position = self.fp.tell() # Preserve current position in file
      self.fp.seek(zinfo.header_offset, 0)
      self.fp.write(zinfo.FileHeader(zip64))
      self.fp.seek(position, 0)
      self.filelist.append(zinfo)
      self.NameToInfo[zinfo.filename] = zinfo def writestr(self, zinfo_or_arcname, bytes, compress_type=None):
      """Write a file into the archive. The contents is the string
      'bytes'. 'zinfo_or_arcname' is either a ZipInfo instance or
      the name of the file in the archive."""
      if not isinstance(zinfo_or_arcname, ZipInfo):
      zinfo = ZipInfo(filename=zinfo_or_arcname,
      date_time=time.localtime(time.time())[:6]) zinfo.compress_type = self.compression
      if zinfo.filename[-1] == '/':
      zinfo.external_attr = 0o40775 << 16 # drwxrwxr-x
      zinfo.external_attr |= 0x10 # MS-DOS directory flag
      else:
      zinfo.external_attr = 0o600 << 16 # ?rw-------
      else:
      zinfo = zinfo_or_arcname if not self.fp:
      raise RuntimeError(
      "Attempt to write to ZIP archive that was already closed") if compress_type is not None:
      zinfo.compress_type = compress_type zinfo.file_size = len(bytes) # Uncompressed size
      zinfo.header_offset = self.fp.tell() # Start of header bytes
      self._writecheck(zinfo)
      self._didModify = True
      zinfo.CRC = crc32(bytes) & 0xffffffff # CRC-32 checksum
      if zinfo.compress_type == ZIP_DEFLATED:
      co = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION,
      zlib.DEFLATED, -15)
      bytes = co.compress(bytes) + co.flush()
      zinfo.compress_size = len(bytes) # Compressed size
      else:
      zinfo.compress_size = zinfo.file_size
      zip64 = zinfo.file_size > ZIP64_LIMIT or \
      zinfo.compress_size > ZIP64_LIMIT
      if zip64 and not self._allowZip64:
      raise LargeZipFile("Filesize would require ZIP64 extensions")
      self.fp.write(zinfo.FileHeader(zip64))
      self.fp.write(bytes)
      if zinfo.flag_bits & 0x08:
      # Write CRC and file sizes after the file data
      fmt = '<LQQ' if zip64 else '<LLL'
      self.fp.write(struct.pack(fmt, zinfo.CRC, zinfo.compress_size,
      zinfo.file_size))
      self.fp.flush()
      self.filelist.append(zinfo)
      self.NameToInfo[zinfo.filename] = zinfo def __del__(self):
      """Call the "close()" method in case the user forgot."""
      self.close() def close(self):
      """Close the file, and for mode "w" and "a" write the ending
      records."""
      if self.fp is None:
      return try:
      if self.mode in ("w", "a") and self._didModify: # write ending records
      pos1 = self.fp.tell()
      for zinfo in self.filelist: # write central directory
      dt = zinfo.date_time
      dosdate = (dt[0] - 1980) << 9 | dt[1] << 5 | dt[2]
      dostime = dt[3] << 11 | dt[4] << 5 | (dt[5] // 2)
      extra = []
      if zinfo.file_size > ZIP64_LIMIT \
      or zinfo.compress_size > ZIP64_LIMIT:
      extra.append(zinfo.file_size)
      extra.append(zinfo.compress_size)
      file_size = 0xffffffff
      compress_size = 0xffffffff
      else:
      file_size = zinfo.file_size
      compress_size = zinfo.compress_size if zinfo.header_offset > ZIP64_LIMIT:
      extra.append(zinfo.header_offset)
      header_offset = 0xffffffffL
      else:
      header_offset = zinfo.header_offset extra_data = zinfo.extra
      if extra:
      # Append a ZIP64 field to the extra's
      extra_data = struct.pack(
      '<HH' + 'Q'*len(extra),
      1, 8*len(extra), *extra) + extra_data extract_version = max(45, zinfo.extract_version)
      create_version = max(45, zinfo.create_version)
      else:
      extract_version = zinfo.extract_version
      create_version = zinfo.create_version try:
      filename, flag_bits = zinfo._encodeFilenameFlags()
      centdir = struct.pack(structCentralDir,
      stringCentralDir, create_version,
      zinfo.create_system, extract_version, zinfo.reserved,
      flag_bits, zinfo.compress_type, dostime, dosdate,
      zinfo.CRC, compress_size, file_size,
      len(filename), len(extra_data), len(zinfo.comment),
      0, zinfo.internal_attr, zinfo.external_attr,
      header_offset)
      except DeprecationWarning:
      print >>sys.stderr, (structCentralDir,
      stringCentralDir, create_version,
      zinfo.create_system, extract_version, zinfo.reserved,
      zinfo.flag_bits, zinfo.compress_type, dostime, dosdate,
      zinfo.CRC, compress_size, file_size,
      len(zinfo.filename), len(extra_data), len(zinfo.comment),
      0, zinfo.internal_attr, zinfo.external_attr,
      header_offset)
      raise
      self.fp.write(centdir)
      self.fp.write(filename)
      self.fp.write(extra_data)
      self.fp.write(zinfo.comment) pos2 = self.fp.tell()
      # Write end-of-zip-archive record
      centDirCount = len(self.filelist)
      centDirSize = pos2 - pos1
      centDirOffset = pos1
      requires_zip64 = None
      if centDirCount > ZIP_FILECOUNT_LIMIT:
      requires_zip64 = "Files count"
      elif centDirOffset > ZIP64_LIMIT:
      requires_zip64 = "Central directory offset"
      elif centDirSize > ZIP64_LIMIT:
      requires_zip64 = "Central directory size"
      if requires_zip64:
      # Need to write the ZIP64 end-of-archive records
      if not self._allowZip64:
      raise LargeZipFile(requires_zip64 +
      " would require ZIP64 extensions")
      zip64endrec = struct.pack(
      structEndArchive64, stringEndArchive64,
      44, 45, 45, 0, 0, centDirCount, centDirCount,
      centDirSize, centDirOffset)
      self.fp.write(zip64endrec) zip64locrec = struct.pack(
      structEndArchive64Locator,
      stringEndArchive64Locator, 0, pos2, 1)
      self.fp.write(zip64locrec)
      centDirCount = min(centDirCount, 0xFFFF)
      centDirSize = min(centDirSize, 0xFFFFFFFF)
      centDirOffset = min(centDirOffset, 0xFFFFFFFF) endrec = struct.pack(structEndArchive, stringEndArchive,
      0, 0, centDirCount, centDirCount,
      centDirSize, centDirOffset, len(self._comment))
      self.fp.write(endrec)
      self.fp.write(self._comment)
      self.fp.flush()
      finally:
      fp = self.fp
      self.fp = None
      if not self._filePassed:
      fp.close() ZipFile

      ZipFile

      class TarFile(object):
      """The TarFile Class provides an interface to tar archives.
      """ debug = 0 # May be set from 0 (no msgs) to 3 (all msgs) dereference = False # If true, add content of linked file to the
      # tar file, else the link. ignore_zeros = False # If true, skips empty or invalid blocks and
      # continues processing. errorlevel = 1 # If 0, fatal errors only appear in debug
      # messages (if debug >= 0). If > 0, errors
      # are passed to the caller as exceptions. format = DEFAULT_FORMAT # The format to use when creating an archive. encoding = ENCODING # Encoding for 8-bit character strings. errors = None # Error handler for unicode conversion. tarinfo = TarInfo # The default TarInfo class to use. fileobject = ExFileObject # The default ExFileObject class to use. def __init__(self, name=None, mode="r", fileobj=None, format=None,
      tarinfo=None, dereference=None, ignore_zeros=None, encoding=None,
      errors=None, pax_headers=None, debug=None, errorlevel=None):
      """Open an (uncompressed) tar archive `name'. `mode' is either 'r' to
      read from an existing archive, 'a' to append data to an existing
      file or 'w' to create a new file overwriting an existing one. `mode'
      defaults to 'r'.
      If `fileobj' is given, it is used for reading or writing data. If it
      can be determined, `mode' is overridden by `fileobj's mode.
      `fileobj' is not closed, when TarFile is closed.
      """
      modes = {"r": "rb", "a": "r+b", "w": "wb"}
      if mode not in modes:
      raise ValueError("mode must be 'r', 'a' or 'w'")
      self.mode = mode
      self._mode = modes[mode] if not fileobj:
      if self.mode == "a" and not os.path.exists(name):
      # Create nonexistent files in append mode.
      self.mode = "w"
      self._mode = "wb"
      fileobj = bltn_open(name, self._mode)
      self._extfileobj = False
      else:
      if name is None and hasattr(fileobj, "name"):
      name = fileobj.name
      if hasattr(fileobj, "mode"):
      self._mode = fileobj.mode
      self._extfileobj = True
      self.name = os.path.abspath(name) if name else None
      self.fileobj = fileobj # Init attributes.
      if format is not None:
      self.format = format
      if tarinfo is not None:
      self.tarinfo = tarinfo
      if dereference is not None:
      self.dereference = dereference
      if ignore_zeros is not None:
      self.ignore_zeros = ignore_zeros
      if encoding is not None:
      self.encoding = encoding if errors is not None:
      self.errors = errors
      elif mode == "r":
      self.errors = "utf-8"
      else:
      self.errors = "strict" if pax_headers is not None and self.format == PAX_FORMAT:
      self.pax_headers = pax_headers
      else:
      self.pax_headers = {} if debug is not None:
      self.debug = debug
      if errorlevel is not None:
      self.errorlevel = errorlevel # Init datastructures.
      self.closed = False
      self.members = [] # list of members as TarInfo objects
      self._loaded = False # flag if all members have been read
      self.offset = self.fileobj.tell()
      # current position in the archive file
      self.inodes = {} # dictionary caching the inodes of
      # archive members already added try:
      if self.mode == "r":
      self.firstmember = None
      self.firstmember = self.next() if self.mode == "a":
      # Move to the end of the archive,
      # before the first empty block.
      while True:
      self.fileobj.seek(self.offset)
      try:
      tarinfo = self.tarinfo.fromtarfile(self)
      self.members.append(tarinfo)
      except EOFHeaderError:
      self.fileobj.seek(self.offset)
      break
      except HeaderError, e:
      raise ReadError(str(e)) if self.mode in "aw":
      self._loaded = True if self.pax_headers:
      buf = self.tarinfo.create_pax_global_header(self.pax_headers.copy())
      self.fileobj.write(buf)
      self.offset += len(buf)
      except:
      if not self._extfileobj:
      self.fileobj.close()
      self.closed = True
      raise def _getposix(self):
      return self.format == USTAR_FORMAT
      def _setposix(self, value):
      import warnings
      warnings.warn("use the format attribute instead", DeprecationWarning,
      2)
      if value:
      self.format = USTAR_FORMAT
      else:
      self.format = GNU_FORMAT
      posix = property(_getposix, _setposix) #--------------------------------------------------------------------------
      # Below are the classmethods which act as alternate constructors to the
      # TarFile class. The open() method is the only one that is needed for
      # public use; it is the "super"-constructor and is able to select an
      # adequate "sub"-constructor for a particular compression using the mapping
      # from OPEN_METH.
      #
      # This concept allows one to subclass TarFile without losing the comfort of
      # the super-constructor. A sub-constructor is registered and made available
      # by adding it to the mapping in OPEN_METH. @classmethod
      def open(cls, name=None, mode="r", fileobj=None, bufsize=RECORDSIZE, **kwargs):
      """Open a tar archive for reading, writing or appending. Return
      an appropriate TarFile class. mode:
      'r' or 'r:*' open for reading with transparent compression
      'r:' open for reading exclusively uncompressed
      'r:gz' open for reading with gzip compression
      'r:bz2' open for reading with bzip2 compression
      'a' or 'a:' open for appending, creating the file if necessary
      'w' or 'w:' open for writing without compression
      'w:gz' open for writing with gzip compression
      'w:bz2' open for writing with bzip2 compression 'r|*' open a stream of tar blocks with transparent compression
      'r|' open an uncompressed stream of tar blocks for reading
      'r|gz' open a gzip compressed stream of tar blocks
      'r|bz2' open a bzip2 compressed stream of tar blocks
      'w|' open an uncompressed stream for writing
      'w|gz' open a gzip compressed stream for writing
      'w|bz2' open a bzip2 compressed stream for writing
      """ if not name and not fileobj:
      raise ValueError("nothing to open") if mode in ("r", "r:*"):
      # Find out which *open() is appropriate for opening the file.
      for comptype in cls.OPEN_METH:
      func = getattr(cls, cls.OPEN_METH[comptype])
      if fileobj is not None:
      saved_pos = fileobj.tell()
      try:
      return func(name, "r", fileobj, **kwargs)
      except (ReadError, CompressionError), e:
      if fileobj is not None:
      fileobj.seek(saved_pos)
      continue
      raise ReadError("file could not be opened successfully") elif ":" in mode:
      filemode, comptype = mode.split(":", 1)
      filemode = filemode or "r"
      comptype = comptype or "tar" # Select the *open() function according to
      # given compression.
      if comptype in cls.OPEN_METH:
      func = getattr(cls, cls.OPEN_METH[comptype])
      else:
      raise CompressionError("unknown compression type %r" % comptype)
      return func(name, filemode, fileobj, **kwargs) elif "|" in mode:
      filemode, comptype = mode.split("|", 1)
      filemode = filemode or "r"
      comptype = comptype or "tar" if filemode not in ("r", "w"):
      raise ValueError("mode must be 'r' or 'w'") stream = _Stream(name, filemode, comptype, fileobj, bufsize)
      try:
      t = cls(name, filemode, stream, **kwargs)
      except:
      stream.close()
      raise
      t._extfileobj = False
      return t elif mode in ("a", "w"):
      return cls.taropen(name, mode, fileobj, **kwargs) raise ValueError("undiscernible mode") @classmethod
      def taropen(cls, name, mode="r", fileobj=None, **kwargs):
      """Open uncompressed tar archive name for reading or writing.
      """
      if mode not in ("r", "a", "w"):
      raise ValueError("mode must be 'r', 'a' or 'w'")
      return cls(name, mode, fileobj, **kwargs) @classmethod
      def gzopen(cls, name, mode="r", fileobj=None, compresslevel=9, **kwargs):
      """Open gzip compressed tar archive name for reading or writing.
      Appending is not allowed.
      """
      if mode not in ("r", "w"):
      raise ValueError("mode must be 'r' or 'w'") try:
      import gzip
      gzip.GzipFile
      except (ImportError, AttributeError):
      raise CompressionError("gzip module is not available") try:
      fileobj = gzip.GzipFile(name, mode, compresslevel, fileobj)
      except OSError:
      if fileobj is not None and mode == 'r':
      raise ReadError("not a gzip file")
      raise try:
      t = cls.taropen(name, mode, fileobj, **kwargs)
      except IOError:
      fileobj.close()
      if mode == 'r':
      raise ReadError("not a gzip file")
      raise
      except:
      fileobj.close()
      raise
      t._extfileobj = False
      return t @classmethod
      def bz2open(cls, name, mode="r", fileobj=None, compresslevel=9, **kwargs):
      """Open bzip2 compressed tar archive name for reading or writing.
      Appending is not allowed.
      """
      if mode not in ("r", "w"):
      raise ValueError("mode must be 'r' or 'w'.") try:
      import bz2
      except ImportError:
      raise CompressionError("bz2 module is not available") if fileobj is not None:
      fileobj = _BZ2Proxy(fileobj, mode)
      else:
      fileobj = bz2.BZ2File(name, mode, compresslevel=compresslevel) try:
      t = cls.taropen(name, mode, fileobj, **kwargs)
      except (IOError, EOFError):
      fileobj.close()
      if mode == 'r':
      raise ReadError("not a bzip2 file")
      raise
      except:
      fileobj.close()
      raise
      t._extfileobj = False
      return t # All *open() methods are registered here.
      OPEN_METH = {
      "tar": "taropen", # uncompressed tar
      "gz": "gzopen", # gzip compressed tar
      "bz2": "bz2open" # bzip2 compressed tar
      } #--------------------------------------------------------------------------
      # The public methods which TarFile provides: def close(self):
      """Close the TarFile. In write-mode, two finishing zero blocks are
      appended to the archive.
      """
      if self.closed:
      return if self.mode in "aw":
      self.fileobj.write(NUL * (BLOCKSIZE * 2))
      self.offset += (BLOCKSIZE * 2)
      # fill up the end with zero-blocks
      # (like option -b20 for tar does)
      blocks, remainder = divmod(self.offset, RECORDSIZE)
      if remainder > 0:
      self.fileobj.write(NUL * (RECORDSIZE - remainder)) if not self._extfileobj:
      self.fileobj.close()
      self.closed = True def getmember(self, name):
      """Return a TarInfo object for member `name'. If `name' can not be
      found in the archive, KeyError is raised. If a member occurs more
      than once in the archive, its last occurrence is assumed to be the
      most up-to-date version.
      """
      tarinfo = self._getmember(name)
      if tarinfo is None:
      raise KeyError("filename %r not found" % name)
      return tarinfo def getmembers(self):
      """Return the members of the archive as a list of TarInfo objects. The
      list has the same order as the members in the archive.
      """
      self._check()
      if not self._loaded: # if we want to obtain a list of
      self._load() # all members, we first have to
      # scan the whole archive.
      return self.members def getnames(self):
      """Return the members of the archive as a list of their names. It has
      the same order as the list returned by getmembers().
      """
      return [tarinfo.name for tarinfo in self.getmembers()] def gettarinfo(self, name=None, arcname=None, fileobj=None):
      """Create a TarInfo object for either the file `name' or the file
      object `fileobj' (using os.fstat on its file descriptor). You can
      modify some of the TarInfo's attributes before you add it using
      addfile(). If given, `arcname' specifies an alternative name for the
      file in the archive.
      """
      self._check("aw") # When fileobj is given, replace name by
      # fileobj's real name.
      if fileobj is not None:
      name = fileobj.name # Building the name of the member in the archive.
      # Backward slashes are converted to forward slashes,
      # Absolute paths are turned to relative paths.
      if arcname is None:
      arcname = name
      drv, arcname = os.path.splitdrive(arcname)
      arcname = arcname.replace(os.sep, "/")
      arcname = arcname.lstrip("/") # Now, fill the TarInfo object with
      # information specific for the file.
      tarinfo = self.tarinfo()
      tarinfo.tarfile = self # Use os.stat or os.lstat, depending on platform
      # and if symlinks shall be resolved.
      if fileobj is None:
      if hasattr(os, "lstat") and not self.dereference:
      statres = os.lstat(name)
      else:
      statres = os.stat(name)
      else:
      statres = os.fstat(fileobj.fileno())
      linkname = "" stmd = statres.st_mode
      if stat.S_ISREG(stmd):
      inode = (statres.st_ino, statres.st_dev)
      if not self.dereference and statres.st_nlink > 1 and \
      inode in self.inodes and arcname != self.inodes[inode]:
      # Is it a hardlink to an already
      # archived file?
      type = LNKTYPE
      linkname = self.inodes[inode]
      else:
      # The inode is added only if its valid.
      # For win32 it is always 0.
      type = REGTYPE
      if inode[0]:
      self.inodes[inode] = arcname
      elif stat.S_ISDIR(stmd):
      type = DIRTYPE
      elif stat.S_ISFIFO(stmd):
      type = FIFOTYPE
      elif stat.S_ISLNK(stmd):
      type = SYMTYPE
      linkname = os.readlink(name)
      elif stat.S_ISCHR(stmd):
      type = CHRTYPE
      elif stat.S_ISBLK(stmd):
      type = BLKTYPE
      else:
      return None # Fill the TarInfo object with all
      # information we can get.
      tarinfo.name = arcname
      tarinfo.mode = stmd
      tarinfo.uid = statres.st_uid
      tarinfo.gid = statres.st_gid
      if type == REGTYPE:
      tarinfo.size = statres.st_size
      else:
      tarinfo.size = 0L
      tarinfo.mtime = statres.st_mtime
      tarinfo.type = type
      tarinfo.linkname = linkname
      if pwd:
      try:
      tarinfo.uname = pwd.getpwuid(tarinfo.uid)[0]
      except KeyError:
      pass
      if grp:
      try:
      tarinfo.gname = grp.getgrgid(tarinfo.gid)[0]
      except KeyError:
      pass if type in (CHRTYPE, BLKTYPE):
      if hasattr(os, "major") and hasattr(os, "minor"):
      tarinfo.devmajor = os.major(statres.st_rdev)
      tarinfo.devminor = os.minor(statres.st_rdev)
      return tarinfo def list(self, verbose=True):
      """Print a table of contents to sys.stdout. If `verbose' is False, only
      the names of the members are printed. If it is True, an `ls -l'-like
      output is produced.
      """
      self._check() for tarinfo in self:
      if verbose:
      print filemode(tarinfo.mode),
      print "%s/%s" % (tarinfo.uname or tarinfo.uid,
      tarinfo.gname or tarinfo.gid),
      if tarinfo.ischr() or tarinfo.isblk():
      print "%10s" % ("%d,%d" \
      % (tarinfo.devmajor, tarinfo.devminor)),
      else:
      print "%10d" % tarinfo.size,
      print "%d-%02d-%02d %02d:%02d:%02d" \
      % time.localtime(tarinfo.mtime)[:6], print tarinfo.name + ("/" if tarinfo.isdir() else ""), if verbose:
      if tarinfo.issym():
      print "->", tarinfo.linkname,
      if tarinfo.islnk():
      print "link to", tarinfo.linkname,
      print def add(self, name, arcname=None, recursive=True, exclude=None, filter=None):
      """Add the file `name' to the archive. `name' may be any type of file
      (directory, fifo, symbolic link, etc.). If given, `arcname'
      specifies an alternative name for the file in the archive.
      Directories are added recursively by default. This can be avoided by
      setting `recursive' to False. `exclude' is a function that should
      return True for each filename to be excluded. `filter' is a function
      that expects a TarInfo object argument and returns the changed
      TarInfo object, if it returns None the TarInfo object will be
      excluded from the archive.
      """
      self._check("aw") if arcname is None:
      arcname = name # Exclude pathnames.
      if exclude is not None:
      import warnings
      warnings.warn("use the filter argument instead",
      DeprecationWarning, 2)
      if exclude(name):
      self._dbg(2, "tarfile: Excluded %r" % name)
      return # Skip if somebody tries to archive the archive...
      if self.name is not None and os.path.abspath(name) == self.name:
      self._dbg(2, "tarfile: Skipped %r" % name)
      return self._dbg(1, name) # Create a TarInfo object from the file.
      tarinfo = self.gettarinfo(name, arcname) if tarinfo is None:
      self._dbg(1, "tarfile: Unsupported type %r" % name)
      return # Change or exclude the TarInfo object.
      if filter is not None:
      tarinfo = filter(tarinfo)
      if tarinfo is None:
      self._dbg(2, "tarfile: Excluded %r" % name)
      return # Append the tar header and data to the archive.
      if tarinfo.isreg():
      with bltn_open(name, "rb") as f:
      self.addfile(tarinfo, f) elif tarinfo.isdir():
      self.addfile(tarinfo)
      if recursive:
      for f in os.listdir(name):
      self.add(os.path.join(name, f), os.path.join(arcname, f),
      recursive, exclude, filter) else:
      self.addfile(tarinfo) def addfile(self, tarinfo, fileobj=None):
      """Add the TarInfo object `tarinfo' to the archive. If `fileobj' is
      given, tarinfo.size bytes are read from it and added to the archive.
      You can create TarInfo objects using gettarinfo().
      On Windows platforms, `fileobj' should always be opened with mode
      'rb' to avoid irritation about the file size.
      """
      self._check("aw") tarinfo = copy.copy(tarinfo) buf = tarinfo.tobuf(self.format, self.encoding, self.errors)
      self.fileobj.write(buf)
      self.offset += len(buf) # If there's data to follow, append it.
      if fileobj is not None:
      copyfileobj(fileobj, self.fileobj, tarinfo.size)
      blocks, remainder = divmod(tarinfo.size, BLOCKSIZE)
      if remainder > 0:
      self.fileobj.write(NUL * (BLOCKSIZE - remainder))
      blocks += 1
      self.offset += blocks * BLOCKSIZE self.members.append(tarinfo) def extractall(self, path=".", members=None):
      """Extract all members from the archive to the current working
      directory and set owner, modification time and permissions on
      directories afterwards. `path' specifies a different directory
      to extract to. `members' is optional and must be a subset of the
      list returned by getmembers().
      """
      directories = [] if members is None:
      members = self for tarinfo in members:
      if tarinfo.isdir():
      # Extract directories with a safe mode.
      directories.append(tarinfo)
      tarinfo = copy.copy(tarinfo)
      tarinfo.mode = 0700
      self.extract(tarinfo, path) # Reverse sort directories.
      directories.sort(key=operator.attrgetter('name'))
      directories.reverse() # Set correct owner, mtime and filemode on directories.
      for tarinfo in directories:
      dirpath = os.path.join(path, tarinfo.name)
      try:
      self.chown(tarinfo, dirpath)
      self.utime(tarinfo, dirpath)
      self.chmod(tarinfo, dirpath)
      except ExtractError, e:
      if self.errorlevel > 1:
      raise
      else:
      self._dbg(1, "tarfile: %s" % e) def extract(self, member, path=""):
      """Extract a member from the archive to the current working directory,
      using its full name. Its file information is extracted as accurately
      as possible. `member' may be a filename or a TarInfo object. You can
      specify a different directory using `path'.
      """
      self._check("r") if isinstance(member, basestring):
      tarinfo = self.getmember(member)
      else:
      tarinfo = member # Prepare the link target for makelink().
      if tarinfo.islnk():
      tarinfo._link_target = os.path.join(path, tarinfo.linkname) try:
      self._extract_member(tarinfo, os.path.join(path, tarinfo.name))
      except EnvironmentError, e:
      if self.errorlevel > 0:
      raise
      else:
      if e.filename is None:
      self._dbg(1, "tarfile: %s" % e.strerror)
      else:
      self._dbg(1, "tarfile: %s %r" % (e.strerror, e.filename))
      except ExtractError, e:
      if self.errorlevel > 1:
      raise
      else:
      self._dbg(1, "tarfile: %s" % e) def extractfile(self, member):
      """Extract a member from the archive as a file object. `member' may be
      a filename or a TarInfo object. If `member' is a regular file, a
      file-like object is returned. If `member' is a link, a file-like
      object is constructed from the link's target. If `member' is none of
      the above, None is returned.
      The file-like object is read-only and provides the following
      methods: read(), readline(), readlines(), seek() and tell()
      """
      self._check("r") if isinstance(member, basestring):
      tarinfo = self.getmember(member)
      else:
      tarinfo = member if tarinfo.isreg():
      return self.fileobject(self, tarinfo) elif tarinfo.type not in SUPPORTED_TYPES:
      # If a member's type is unknown, it is treated as a
      # regular file.
      return self.fileobject(self, tarinfo) elif tarinfo.islnk() or tarinfo.issym():
      if isinstance(self.fileobj, _Stream):
      # A small but ugly workaround for the case that someone tries
      # to extract a (sym)link as a file-object from a non-seekable
      # stream of tar blocks.
      raise StreamError("cannot extract (sym)link as file object")
      else:
      # A (sym)link's file object is its target's file object.
      return self.extractfile(self._find_link_target(tarinfo))
      else:
      # If there's no data associated with the member (directory, chrdev,
      # blkdev, etc.), return None instead of a file object.
      return None def _extract_member(self, tarinfo, targetpath):
      """Extract the TarInfo object tarinfo to a physical
      file called targetpath.
      """
      # Fetch the TarInfo object for the given name
      # and build the destination pathname, replacing
      # forward slashes to platform specific separators.
      targetpath = targetpath.rstrip("/")
      targetpath = targetpath.replace("/", os.sep) # Create all upper directories.
      upperdirs = os.path.dirname(targetpath)
      if upperdirs and not os.path.exists(upperdirs):
      # Create directories that are not part of the archive with
      # default permissions.
      os.makedirs(upperdirs) if tarinfo.islnk() or tarinfo.issym():
      self._dbg(1, "%s -> %s" % (tarinfo.name, tarinfo.linkname))
      else:
      self._dbg(1, tarinfo.name) if tarinfo.isreg():
      self.makefile(tarinfo, targetpath)
      elif tarinfo.isdir():
      self.makedir(tarinfo, targetpath)
      elif tarinfo.isfifo():
      self.makefifo(tarinfo, targetpath)
      elif tarinfo.ischr() or tarinfo.isblk():
      self.makedev(tarinfo, targetpath)
      elif tarinfo.islnk() or tarinfo.issym():
      self.makelink(tarinfo, targetpath)
      elif tarinfo.type not in SUPPORTED_TYPES:
      self.makeunknown(tarinfo, targetpath)
      else:
      self.makefile(tarinfo, targetpath) self.chown(tarinfo, targetpath)
      if not tarinfo.issym():
      self.chmod(tarinfo, targetpath)
      self.utime(tarinfo, targetpath) #--------------------------------------------------------------------------
      # Below are the different file methods. They are called via
      # _extract_member() when extract() is called. They can be replaced in a
      # subclass to implement other functionality. def makedir(self, tarinfo, targetpath):
      """Make a directory called targetpath.
      """
      try:
      # Use a safe mode for the directory, the real mode is set
      # later in _extract_member().
      os.mkdir(targetpath, 0700)
      except EnvironmentError, e:
      if e.errno != errno.EEXIST:
      raise def makefile(self, tarinfo, targetpath):
      """Make a file called targetpath.
      """
      source = self.extractfile(tarinfo)
      try:
      with bltn_open(targetpath, "wb") as target:
      copyfileobj(source, target)
      finally:
      source.close() def makeunknown(self, tarinfo, targetpath):
      """Make a file from a TarInfo object with an unknown type
      at targetpath.
      """
      self.makefile(tarinfo, targetpath)
      self._dbg(1, "tarfile: Unknown file type %r, " \
      "extracted as regular file." % tarinfo.type) def makefifo(self, tarinfo, targetpath):
      """Make a fifo called targetpath.
      """
      if hasattr(os, "mkfifo"):
      os.mkfifo(targetpath)
      else:
      raise ExtractError("fifo not supported by system") def makedev(self, tarinfo, targetpath):
      """Make a character or block device called targetpath.
      """
      if not hasattr(os, "mknod") or not hasattr(os, "makedev"):
      raise ExtractError("special devices not supported by system") mode = tarinfo.mode
      if tarinfo.isblk():
      mode |= stat.S_IFBLK
      else:
      mode |= stat.S_IFCHR os.mknod(targetpath, mode,
      os.makedev(tarinfo.devmajor, tarinfo.devminor)) def makelink(self, tarinfo, targetpath):
      """Make a (symbolic) link called targetpath. If it cannot be created
      (platform limitation), we try to make a copy of the referenced file
      instead of a link.
      """
      if hasattr(os, "symlink") and hasattr(os, "link"):
      # For systems that support symbolic and hard links.
      if tarinfo.issym():
      if os.path.lexists(targetpath):
      os.unlink(targetpath)
      os.symlink(tarinfo.linkname, targetpath)
      else:
      # See extract().
      if os.path.exists(tarinfo._link_target):
      if os.path.lexists(targetpath):
      os.unlink(targetpath)
      os.link(tarinfo._link_target, targetpath)
      else:
      self._extract_member(self._find_link_target(tarinfo), targetpath)
      else:
      try:
      self._extract_member(self._find_link_target(tarinfo), targetpath)
      except KeyError:
      raise ExtractError("unable to resolve link inside archive") def chown(self, tarinfo, targetpath):
      """Set owner of targetpath according to tarinfo.
      """
      if pwd and hasattr(os, "geteuid") and os.geteuid() == 0:
      # We have to be root to do so.
      try:
      g = grp.getgrnam(tarinfo.gname)[2]
      except KeyError:
      g = tarinfo.gid
      try:
      u = pwd.getpwnam(tarinfo.uname)[2]
      except KeyError:
      u = tarinfo.uid
      try:
      if tarinfo.issym() and hasattr(os, "lchown"):
      os.lchown(targetpath, u, g)
      else:
      if sys.platform != "os2emx":
      os.chown(targetpath, u, g)
      except EnvironmentError, e:
      raise ExtractError("could not change owner") def chmod(self, tarinfo, targetpath):
      """Set file permissions of targetpath according to tarinfo.
      """
      if hasattr(os, 'chmod'):
      try:
      os.chmod(targetpath, tarinfo.mode)
      except EnvironmentError, e:
      raise ExtractError("could not change mode") def utime(self, tarinfo, targetpath):
      """Set modification time of targetpath according to tarinfo.
      """
      if not hasattr(os, 'utime'):
      return
      try:
      os.utime(targetpath, (tarinfo.mtime, tarinfo.mtime))
      except EnvironmentError, e:
      raise ExtractError("could not change modification time") #--------------------------------------------------------------------------
      def next(self):
      """Return the next member of the archive as a TarInfo object, when
      TarFile is opened for reading. Return None if there is no more
      available.
      """
      self._check("ra")
      if self.firstmember is not None:
      m = self.firstmember
      self.firstmember = None
      return m # Read the next block.
      self.fileobj.seek(self.offset)
      tarinfo = None
      while True:
      try:
      tarinfo = self.tarinfo.fromtarfile(self)
      except EOFHeaderError, e:
      if self.ignore_zeros:
      self._dbg(2, "0x%X: %s" % (self.offset, e))
      self.offset += BLOCKSIZE
      continue
      except InvalidHeaderError, e:
      if self.ignore_zeros:
      self._dbg(2, "0x%X: %s" % (self.offset, e))
      self.offset += BLOCKSIZE
      continue
      elif self.offset == 0:
      raise ReadError(str(e))
      except EmptyHeaderError:
      if self.offset == 0:
      raise ReadError("empty file")
      except TruncatedHeaderError, e:
      if self.offset == 0:
      raise ReadError(str(e))
      except SubsequentHeaderError, e:
      raise ReadError(str(e))
      break if tarinfo is not None:
      self.members.append(tarinfo)
      else:
      self._loaded = True return tarinfo #--------------------------------------------------------------------------
      # Little helper methods: def _getmember(self, name, tarinfo=None, normalize=False):
      """Find an archive member by name from bottom to top.
      If tarinfo is given, it is used as the starting point.
      """
      # Ensure that all members have been loaded.
      members = self.getmembers() # Limit the member search list up to tarinfo.
      if tarinfo is not None:
      members = members[:members.index(tarinfo)] if normalize:
      name = os.path.normpath(name) for member in reversed(members):
      if normalize:
      member_name = os.path.normpath(member.name)
      else:
      member_name = member.name if name == member_name:
      return member def _load(self):
      """Read through the entire archive file and look for readable
      members.
      """
      while True:
      tarinfo = self.next()
      if tarinfo is None:
      break
      self._loaded = True def _check(self, mode=None):
      """Check if TarFile is still open, and if the operation's mode
      corresponds to TarFile's mode.
      """
      if self.closed:
      raise IOError("%s is closed" % self.__class__.__name__)
      if mode is not None and self.mode not in mode:
      raise IOError("bad operation for mode %r" % self.mode) def _find_link_target(self, tarinfo):
      """Find the target member of a symlink or hardlink member in the
      archive.
      """
      if tarinfo.issym():
      # Always search the entire archive.
      linkname = "/".join(filter(None, (os.path.dirname(tarinfo.name), tarinfo.linkname)))
      limit = None
      else:
      # Search the archive before the link, because a hard link is
      # just a reference to an already archived file.
      linkname = tarinfo.linkname
      limit = tarinfo member = self._getmember(linkname, tarinfo=limit, normalize=True)
      if member is None:
      raise KeyError("linkname %r not found" % linkname)
      return member def __iter__(self):
      """Provide an iterator object.
      """
      if self._loaded:
      return iter(self.members)
      else:
      return TarIter(self) def _dbg(self, level, msg):
      """Write debugging output to sys.stderr.
      """
      if level <= self.debug:
      print >> sys.stderr, msg def __enter__(self):
      self._check()
      return self def __exit__(self, type, value, traceback):
      if type is None:
      self.close()
      else:
      # An exception occurred. We must not call close() because
      # it would try to write end-of-archive blocks and padding.
      if not self._extfileobj:
      self.fileobj.close()
      self.closed = True
      # class TarFile TarFile

      TarFile

shuit模块的更多相关文章

  1. 第二十天 模块 sys os os下path settings random shuit

    一.sys模块 1.sys.argv 命令行参数List,第一个元素是程序本身路径 2.sys.exit(n) 退出程序,正常退出时exit(0) 3.sys.version 获取Pythonn解释程 ...

  2. npm 私有模块的管理使用

    你可以使用 NPM 命令行工具来管理你在 NPM 仓库的私有模块代码,这使得在项目中使用公共模块变的更加方便. 开始前的工作 你需要一个 2.7.0 以上版本的 npm ,并且需要有一个可以登陆 np ...

  3. node.js学习(三)简单的node程序&&模块简单使用&&commonJS规范&&深入理解模块原理

    一.一个简单的node程序 1.新建一个txt文件 2.修改后缀 修改之后会弹出这个,点击"是" 3.运行test.js 源文件 使用node.js运行之后的. 如果该路径下没有该 ...

  4. ES6模块import细节

    写在前面,目前浏览器对ES6的import支持还不是很好,需要用bable转译. ES6引入外部模块分两种情况: 1.导入外部的变量或函数等: import {firstName, lastName, ...

  5. Python标准模块--ContextManager

    1 模块简介 在数年前,Python 2.5 加入了一个非常特殊的关键字,就是with.with语句允许开发者创建上下文管理器.什么是上下文管理器?上下文管理器就是允许你可以自动地开始和结束一些事情. ...

  6. Python标准模块--Unicode

    1 模块简介 Python 3中最大的变化之一就是删除了Unicode类型.在Python 2中,有str类型和unicode类型,例如, Python 2.7.6 (default, Oct 26 ...

  7. Python标准模块--Iterators和Generators

    1 模块简介 当你开始使用Python编程时,你或许已经使用了iterators(迭代器)和generators(生成器),你当时可能并没有意识到.在本篇博文中,我们将会学习迭代器和生成器是什么.当然 ...

  8. 自己实现一个javascript事件模块

    nodejs中的事件模块 nodejs中有一个events模块,用来给别的函数对象提供绑定事件.触发事件的能力.这个别的函数的对象,我把它叫做事件宿主对象(非权威叫法),其原理是把宿主函数的原型链指向 ...

  9. 理解nodejs模块的scope

    描述 原文档地址:https://docs.npmjs.com/misc/scope 所有npm模块都有name,有的模块的name还有scope.scope的命名规则和name差不多,同样不能有ur ...

随机推荐

  1. nginx的proxy_cache缓存配置

    为什么要做web cache,我想大家最主要的是解决流量的压力.随着网站流量的提升,如果只是单台机器既处理静态文件,又处理动态脚本,显然效率很难上升,不能处理日益上涨的流量压力.与此同时某些网站的页面 ...

  2. Pmon (LS1B)start.s

    loongson ls1b FPGA验证 只有DDR flash UART pmon移植 和原版本相比,DDR controller和ls1b不一致. /* $Id: start.S,v 1.1.1. ...

  3. __attribute__系列之介绍篇

    1.什么是__attribute__? __attribute__机制是GNU C的一大特色,它可以设置函数属性.变量属性和类型属性等.可以通过它们向编译器提供更多数据,帮助编译器执行优化等. 2._ ...

  4. java - day07 - PrimeNum

    判断质数 package day06; import java.util.Scanner; //验证质数 public class primeNum { public static void main ...

  5. oracle命令登录数据库

    sqlplus aa/aa@jdbc:oracle:thin:@10.200.130.111:1521:nbact 或者 sqlplus aa/aa@nbact

  6. HibernateTools实现pojo类 数据库schma mapping映射的相互转换 二

    接着上一篇博客:HibernateTools实现pojo类 数据库schma mapping映射的相互转换 思路二:由数据库表,生成Mapping映射文件和POJO类. 尽管能够实现,但个人觉着先设计 ...

  7. Spring MVC控制器类名称处理映射

    以下示例显示如何使用Spring Web MVC框架使用控制器类名称处理程序映射. ControllerClassNameHandlerMapping类是基于约定的处理程序映射类,它将URL请求映射到 ...

  8. wchar与char字符转换的探究

    在Xcode 模拟器环境下.測试wchar_t与char的转换: void convert_test() { setlocale(LC_ALL, "zh_CN.UTF-8"); c ...

  9. 第4步:创建RAC共享磁盘组

    方法一:使用asmdevices(推荐使用,但不适用EMC Powerpath) )查看硬盘的SCSI号,两个机器认到的/dev/sda对应在实际的物理盘可能不是一块,但scsi号肯定是完全一致的. ...

  10. ios如何在当前工程中添加编辑新建的FramesWork

    本文转载至 http://www.apkbus.com/android-131519-1-1.html,感谢原文作者的分享.     naniboy 该用户从未签到   可能很多大牛都见过FaceBo ...