本文实例讲述了python实现的用于搜索文件并进行内容替换的类。分享给大家供大家参考。具体实现方法如下:
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
|
#!/usr/bin/python -O
# coding: UTF-8
"""
-replace string in files (recursive)
-display the difference.
v0.2
- search_string can be a re.compile() object -> use re.sub for replacing
v0.1
- initial version
Useable by a small "client" script, e.g.:
-------------------------------------------------------------------------------
#!/usr/bin/python -O
# coding: UTF-8
import sys, re
#sys.path.insert(0,"/path/to/git/repro/") # Please change path
from replace_in_files import SearchAndReplace
SearchAndReplace(
search_path = "/to/the/files/",
# e.g.: simple string replace:
search_string = 'the old string',
replace_string = 'the new string',
# e.g.: Regular expression replacing (used re.sub)
#search_string = re.compile('{% url (.*?) %}'),
#replace_string = "{% url '\g<1>' %}",
search_only = True, # Display only the difference
#search_only = False, # write the new content
file_filter=("*.py",), # fnmatch-Filter
)
-------------------------------------------------------------------------------
:copyleft: 2009-2011 by Jens Diemer
"""
__author__ = "Jens Diemer"
__license__ = """GNU General Public License v3 or above -
http://www.opensource.org/licenses/gpl-license.php"""
__url__ = "http://www.jensdiemer.de"
__version__ = "0.2"
import os, re, time, fnmatch, difflib
# FIXME: see http://*.com/questions/4730121/cant-get-an-objects-class-name-in-python
RE_TYPE = type (re. compile (""))
class SearchAndReplace( object ):
def __init__( self , search_path, search_string, replace_string,
search_only = True , file_filter = ( "*.*" ,)):
self .search_path = search_path
self .search_string = search_string
self .replace_string = replace_string
self .search_only = search_only
self .file_filter = file_filter
assert isinstance ( self .file_filter, ( list , tuple ))
# FIXME: see http://*.com/questions/4730121/cant-get-an-objects-class-name-in-python
self .is_re = isinstance ( self .search_string, RE_TYPE)
print "Search '%s' in [%s]..." % (
self .search_string, self .search_path
)
print "_" * 80
time_begin = time.time()
file_count = self .walk()
print "_" * 80
print "%s files searched in %0.2fsec." % (
file_count, (time.time() - time_begin)
)
def walk( self ):
file_count = 0
for root, dirlist, filelist in os.walk( self .search_path):
if ".svn" in root:
continue
for filename in filelist:
for file_filter in self .file_filter:
if fnmatch.fnmatch(filename, file_filter):
self .search_file(os.path.join(root, filename))
file_count + = 1
return file_count
def search_file( self , filepath):
f = file (filepath, "r" )
old_content = f.read()
f.close()
if self .is_re or self .search_string in old_content:
new_content = self .replace_content(old_content, filepath)
if self .is_re and new_content = = old_content:
return
print filepath
self .display_plaintext_diff(old_content, new_content)
def replace_content( self , old_content, filepath):
if self .is_re:
new_content = self .search_string.sub( self .replace_string, old_content)
if new_content = = old_content:
return old_content
else :
new_content = old_content.replace(
self .search_string, self .replace_string
)
if self .search_only ! = False :
return new_content
print "Write new content into %s..." % filepath,
try :
f = file (filepath, "w" )
f.write(new_content)
f.close()
except IOError, msg:
print "Error:" , msg
else :
print "OK"
print
return new_content
def display_plaintext_diff( self , content1, content2):
"""
Display a diff.
"""
content1 = content1.splitlines()
content2 = content2.splitlines()
diff = difflib.Differ().compare(content1, content2)
def is_diff_line(line):
for char in ( "-" , "+" , "?" ):
if line.startswith(char):
return True
return False
print "line | text\n-------------------------------------------"
old_line = ""
in_block = False
old_lineno = lineno = 0
for line in diff:
if line.startswith( " " ) or line.startswith( "+" ):
lineno + = 1
if old_lineno = = lineno:
display_line = "%4s | %s" % ("", line.rstrip())
else :
display_line = "%4s | %s" % (lineno, line.rstrip())
if is_diff_line(line):
if not in_block:
print "..."
# Display previous line
print old_line
in_block = True
print display_line
else :
if in_block:
# Display the next line aber a diff-block
print display_line
in_block = False
old_line = display_line
old_lineno = lineno
print "..."
if __name__ = = "__main__" :
SearchAndReplace(
search_path = "." ,
# e.g.: simple string replace:
search_string = 'the old string' ,
replace_string = 'the new string' ,
# e.g.: Regular expression replacing (used re.sub)
#search_string = re.compile('{% url (.*?) %}'),
#replace_string = "{% url '\g<1>' %}",
search_only = True , # Display only the difference
# search_only = False, # write the new content
file_filter = ( "*.py" ,), # fnmatch-Filter
)
|
希望本文所述对大家的Python程序设计有所帮助。