os模块提供了对目录或者文件的新建/删除/查看文件属性,还提供了对文件以及目录的路径操作。比如说:绝对路径,父目录…… 但是,os文件的操作还应该包含移动 复制 打包 压缩 解压等操作,这些os模块都没有提供。
而本文所讲的shutil则就是对os中文件操作的补充。--移动 复制 打包 压缩 解压,
shutil函数功能:
1 shutil.copyfileobj(fsrc, fdst[, length=16*1024])
copy文件内容到另一个文件,可以copy指定大小的内容
先来看看其源代码。
1
2
3
4
5
6
7
|
def copyfileobj(fsrc, fdst, length = 16 * 1024 ):
"""copy data from file-like object fsrc to file-like object fdst"""
while 1 :
buf = fsrc.read(length)
if not buf:
break
fdst.write(buf)
|
注意! 在其中fsrc,fdst都是文件对象,都需要打开后才能进行复制操作
1
2
3
4
|
import shutil
f1 = open ( 'name' , 'r' )
f2 = open ( 'name_copy' , 'w+' )
shutil.copyfileobj(f1,f2,length = 16 * 1024 )
|
2 shutil.copyfile(src,dst)
copy文件内容,是不是感觉上面的文件复制很麻烦?还需要自己手动用open函数打开文件,在这里就不需要了,事实上,copyfile调用了copyfileobj
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
|
def copyfile(src, dst, * , follow_symlinks = True ):
if _samefile(src, dst):
raise SameFileError( "{!r} and {!r} are the same file" . format (src, dst))
for fn in [src, dst]:
try :
st = os.stat(fn)
except OSError:
# File most likely does not exist
pass
else :
# XXX What about other special files? (sockets, devices...)
if stat.S_ISFIFO(st.st_mode):
raise SpecialFileError( "`%s` is a named pipe" % fn)
if not follow_symlinks and os.path.islink(src):
os.symlink(os.readlink(src), dst)
else :
with open (src, 'rb' ) as fsrc:
with open (dst, 'wb' ) as fdst:
copyfileobj(fsrc, fdst)
return dst
|
1
2
|
shutil.copyfile( 'name' , 'name_copy_2' )
#一句就可以实现复制文件内容
|
3 shutil.copymode(src,dst)
仅copy权限,不更改文件内容,组和用户。
1
2
3
4
5
6
7
8
9
10
11
12
|
def copymode(src, dst, * , follow_symlinks = True ):
if not follow_symlinks and os.path.islink(src) and os.path.islink(dst):
if hasattr (os, 'lchmod' ):
stat_func, chmod_func = os.lstat, os.lchmod
else :
return
elif hasattr (os, 'chmod' ):
stat_func, chmod_func = os.stat, os.chmod
else :
return
st = stat_func(src)
chmod_func(dst, stat.S_IMODE(st.st_mode))
|
先看两个文件的权限
1
2
3
4
|
[root@slyoyo python_test] # ls -l
total 4
-rw-r--r--. 1 root root 79 May 14 05:17 test1
-rwxr-xr-x. 1 root root 0 May 14 19:10 test2
|
运行命令
1
2
|
>>> import shutil
>>> shutil.copymode( 'test1' , 'test2' )
|
查看结果
1
2
3
4
|
[root@slyoyo python_test] # ls -l
total 4
-rw-r--r--. 1 root root 79 May 14 05:17 test1
-rw-r--r--. 1 root root 0 May 14 19:10 test2
|
当我们将目标文件换为一个不存在的文件时报错
1
2
3
4
5
6
|
>>> shutil.copymode('test1','test3')
Traceback (most recent call last):
File "<stdin>", line 1, in <module>
File "/usr/local/python/lib/python3.4/shutil.py", line 132, in copymode
chmod_func(dst, stat.S_IMODE(st.st_mode))
FileNotFoundError: [Errno 2] No such file or directory: 'test233'
|
4 shutil.copystat(src,dst)
复制所有的状态信息,包括权限,组,用户,时间等
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
|
def copystat(src, dst, * , follow_symlinks = True ):
def _nop( * args, ns = None , follow_symlinks = None ):
pass
# follow symlinks (aka don't not follow symlinks)
follow = follow_symlinks or not (os.path.islink(src) and os.path.islink(dst))
if follow:
# use the real function if it exists
def lookup(name):
return getattr (os, name, _nop)
else :
# use the real function only if it exists
# *and* it supports follow_symlinks
def lookup(name):
fn = getattr (os, name, _nop)
if fn in os.supports_follow_symlinks:
return fn
return _nop
st = lookup( "stat" )(src, follow_symlinks = follow)
mode = stat.S_IMODE(st.st_mode)
lookup( "utime" )(dst, ns = (st.st_atime_ns, st.st_mtime_ns),
follow_symlinks = follow)
try :
lookup( "chmod" )(dst, mode, follow_symlinks = follow)
except NotImplementedError:
# if we got a NotImplementedError, it's because
# * follow_symlinks=False,
# * lchown() is unavailable, and
# * either
# * fchownat() is unavailable or
# * fchownat() doesn't implement AT_SYMLINK_NOFOLLOW.
# (it returned ENOSUP.)
# therefore we're out of options--we simply cannot chown the
# symlink. give up, suppress the error.
# (which is what shutil always did in this circumstance.)
pass
if hasattr (st, 'st_flags' ):
try :
lookup( "chflags" )(dst, st.st_flags, follow_symlinks = follow)
except OSError as why:
for err in 'EOPNOTSUPP' , 'ENOTSUP' :
if hasattr (errno, err) and why.errno = = getattr (errno, err):
break
else :
raise
_copyxattr(src, dst, follow_symlinks = follow)
|
5 shutil.copy(src,dst)
复制文件的内容以及权限,先copyfile后copymode
1
2
3
4
5
6
7
|
def copy(src, dst, * , follow_symlinks = True ):
if os.path.isdir(dst):
dst = os.path.join(dst, os.path.basename(src))
copyfile(src, dst, follow_symlinks = follow_symlinks)
copymode(src, dst, follow_symlinks = follow_symlinks)
return dst
|
6 shutil.copy2(src,dst)
复制文件的内容以及文件的所有状态信息。先copyfile后copystat
1
2
3
4
5
6
7
8
9
10
11
12
|
def copy2(src, dst, * , follow_symlinks = True ):
"""Copy data and all stat info ("cp -p src dst"). Return the file's
destination."
The destination may be a directory.
If follow_symlinks is false, symlinks won't be followed. This
resembles GNU's "cp -P src dst".
"""
if os.path.isdir(dst):
dst = os.path.join(dst, os.path.basename(src))
copyfile(src, dst, follow_symlinks = follow_symlinks)
copystat(src, dst, follow_symlinks = follow_symlinks)
return dst
|
7 shutil.copytree(src, dst, symlinks=False, ignore=None, copy_function=copy2,ignore_dangling_symlinks=False)
递归的复制文件内容及状态信息
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
|
def copytree(src, dst, symlinks = False , ignore = None , copy_function = copy2,
ignore_dangling_symlinks = False ):
names = os.listdir(src)
if ignore is not None :
ignored_names = ignore(src, names)
else :
ignored_names = set ()
os.makedirs(dst)
errors = []
for name in names:
if name in ignored_names:
continue
srcname = os.path.join(src, name)
dstname = os.path.join(dst, name)
try :
if os.path.islink(srcname):
linkto = os.readlink(srcname)
if symlinks:
# We can't just leave it to `copy_function` because legacy
# code with a custom `copy_function` may rely on copytree
# doing the right thing.
os.symlink(linkto, dstname)
copystat(srcname, dstname, follow_symlinks = not symlinks)
else :
# ignore dangling symlink if the flag is on
if not os.path.exists(linkto) and ignore_dangling_symlinks:
continue
# otherwise let the copy occurs. copy2 will raise an error
if os.path.isdir(srcname):
copytree(srcname, dstname, symlinks, ignore,
copy_function)
else :
copy_function(srcname, dstname)
elif os.path.isdir(srcname):
copytree(srcname, dstname, symlinks, ignore, copy_function)
else :
# Will raise a SpecialFileError for unsupported file types
copy_function(srcname, dstname)
# catch the Error from the recursive copytree so that we can
# continue with other files
except Error as err:
errors.extend(err.args[ 0 ])
except OSError as why:
errors.append((srcname, dstname, str (why)))
try :
copystat(src, dst)
except OSError as why:
# Copying file access times may fail on Windows
if getattr (why, 'winerror' , None ) is None :
errors.append((src, dst, str (why)))
if errors:
raise Error(errors)
return dst
# version vulnerable to race conditions
|
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
|
[root@slyoyo python_test] # tree copytree_test/
copytree_test/
└── test
├── test1
├── test2
└── hahaha
[root@slyoyo test ] # ls -l
total 0
-rw-r--r--. 1 python python 0 May 14 19:36 hahaha
-rw-r--r--. 1 python python 0 May 14 19:36 test1
-rw-r--r--. 1 root root 0 May 14 19:36 test2
>>> shutil.copytree( 'copytree_test' , 'copytree_copy' )
'copytree_copy'
[root@slyoyo python_test] # ls -l
total 12
drwxr-xr-x. 3 root root 4096 May 14 19:36 copytree_copy
drwxr-xr-x. 3 root root 4096 May 14 19:36 copytree_test
-rw-r--r--. 1 python python 79 May 14 05:17 test1
-rw-r--r--. 1 root root 0 May 14 19:10 test2
[root@slyoyo python_test] # tree copytree_copy/
copytree_copy/
└── test
├── hahaha
├── test1
└── test2
|
8 shutil.rmtree(path, ignore_errors=False, onerror=None)
递归地删除文件
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
|
def rmtree(path, ignore_errors = False , onerror = None ):
if ignore_errors:
def onerror( * args):
pass
elif onerror is None :
def onerror( * args):
raise
if _use_fd_functions:
# While the unsafe rmtree works fine on bytes, the fd based does not.
if isinstance (path, bytes):
path = os.fsdecode(path)
# Note: To guard against symlink races, we use the standard
# lstat()/open()/fstat() trick.
try :
orig_st = os.lstat(path)
except Exception:
onerror(os.lstat, path, sys.exc_info())
return
try :
fd = os. open (path, os.O_RDONLY)
except Exception:
onerror(os.lstat, path, sys.exc_info())
return
try :
if os.path.samestat(orig_st, os.fstat(fd)):
_rmtree_safe_fd(fd, path, onerror)
try :
os.rmdir(path)
except OSError:
onerror(os.rmdir, path, sys.exc_info())
else :
try :
# symlinks to directories are forbidden, see bug #1669
raise OSError( "Cannot call rmtree on a symbolic link" )
except OSError:
onerror(os.path.islink, path, sys.exc_info())
finally :
os.close(fd)
else :
return _rmtree_unsafe(path, onerror)
|
9 shutil.move(src, dst)
递归的移动文件
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
|
def move(src, dst):
real_dst = dst
if os.path.isdir(dst):
if _samefile(src, dst):
# We might be on a case insensitive filesystem,
# perform the rename anyway.
os.rename(src, dst)
return
real_dst = os.path.join(dst, _basename(src))
if os.path.exists(real_dst):
raise Error( "Destination path '%s' already exists" % real_dst)
try :
os.rename(src, real_dst)
except OSError:
if os.path.islink(src):
linkto = os.readlink(src)
os.symlink(linkto, real_dst)
os.unlink(src)
elif os.path.isdir(src):
if _destinsrc(src, dst):
raise Error( "Cannot move a directory '%s' into itself '%s'." % (src, dst))
copytree(src, real_dst, symlinks = True )
rmtree(src)
else :
copy2(src, real_dst)
os.unlink(src)
return real_dst
|
10 make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,dry_run=0, owner=None, group=None, logger=None)
压缩打包
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
|
def make_archive(base_name, format , root_dir = None , base_dir = None , verbose = 0 ,
dry_run = 0 , owner = None , group = None , logger = None ):
save_cwd = os.getcwd()
if root_dir is not None :
if logger is not None :
logger.debug( "changing into '%s'" , root_dir)
base_name = os.path.abspath(base_name)
if not dry_run:
os.chdir(root_dir)
if base_dir is None :
base_dir = os.curdir
kwargs = { 'dry_run' : dry_run, 'logger' : logger}
try :
format_info = _ARCHIVE_FORMATS[ format ]
except KeyError:
raise ValueError( "unknown archive format '%s'" % format )
func = format_info[ 0 ]
for arg, val in format_info[ 1 ]:
kwargs[arg] = val
if format ! = 'zip' :
kwargs[ 'owner' ] = owner
kwargs[ 'group' ] = group
try :
filename = func(base_name, base_dir, * * kwargs)
finally :
if root_dir is not None :
if logger is not None :
logger.debug( "changing back to '%s'" , save_cwd)
os.chdir(save_cwd)
return filename
|
base_name: 压缩打包后的文件名或者路径名
format: 压缩或者打包格式 "zip", "tar", "bztar"or "gztar"
root_dir : 将哪个目录或者文件打包(也就是源文件)
1
2
3
4
5
6
7
8
|
>>> shutil.make_archive( 'tarball' , 'gztar' ,root_dir= 'copytree_test' )
[root@slyoyo python_test] # ls -l
total 12
drwxr-xr-x. 3 root root 4096 May 14 19:36 copytree_copy
drwxr-xr-x. 3 root root 4096 May 14 19:36 copytree_test
-rw-r--r--. 1 root root 0 May 14 21:12 tarball. tar .gz
-rw-r--r--. 1 python python 79 May 14 05:17 test1
-rw-r--r--. 1 root root 0 May 14 19:10 test2
|