-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathmulti_search_replace.py
303 lines (266 loc) · 11.9 KB
/
multi_search_replace.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
"""
Multi-file search and replace.
Usage:
python multi_search_replace.py folder_path string1 [string2 [safe [postfix [extension_list [exclude_file_list [include_file_list [verbose]]]]]]]
The resulting files are in a folder located in the same place as 'folder_path'
but named 'folder_path'+'postfix'.
TODO: create a setup.py with an entry point to have access to it from anywhere
TODO: Replace the positional argument type interface by an argparse or a traits
GUI
"""
import os
import shutil
import warnings
import numpy as np
def search_for_files(folder_path, extension_list = [".py"],
exclude_file_list = [], include_file_list = None,
verbose = False):
""" Recusively search for the eligible files containing string1.
Apply this to all files with extension in extension_list and that are
not in exclude_file_list.
If safe == True, a copy of the folder is created and both are kept
"""
if verbose:
print("Now exploring folder %s" % os.path.abspath(folder_path))
try:
content = os.listdir(folder_path)
except Exception as e:
raise IOError("The folder_path couldnt be found (exception: %s)" % e)
os.chdir(folder_path)
# list of files eligible for replacement
eligible_files = []
for member in content:
member = os.path.abspath(member)
#print "member", member
if os.path.isfile(member):
if file_to_apply(member, extension_list,
exclude_file_list = exclude_file_list,
include_file_list = include_file_list,
verbose = verbose):
print(" Adding %s to the eligible files"
% member)
eligible_files.append(os.path.abspath(member))
elif os.path.isdir(member):
eligible_files += search_for_files(
folder_path = member,
extension_list = extension_list,
exclude_file_list = exclude_file_list,
include_file_list = include_file_list,
verbose = verbose)
os.chdir(folder_path)
else:
print(" Skipping %s since it is neither a file nor a directory."
% os.path.abspath(member))
return eligible_files
################################################################################
# File selection
################################################################################
def file_to_apply(filename, extension_list = None, exclude_file_list = None,
include_file_list = None, verbose = False):
""" Test if a given file is eligible for a given action.
Must have the correct extension AND
- be in the include_file_list (with or without extension)
OR
- not be in the exclude_file_list (with or without extension)
if only 1 list is provided.
Returns:
- bool
"""
if extension_list is None:
extension_list = []
if exclude_file_list is None:
exclude_file_list = []
if include_file_list is None:
include_file_list = []
if verbose:
print " testing", filename
if include_file_list == [] and exclude_file_list == []:
condition = (os.path.splitext(filename)[1] in extension_list)
elif include_file_list != [] and exclude_file_list == []:
condition = (os.path.splitext(filename)[1] in extension_list
and (os.path.split(filename)[1] in include_file_list
or os.path.splitext(os.path.split(filename)[1])[0]
in include_file_list ))
elif include_file_list == [] and exclude_file_list != []:
condition = (os.path.splitext(filename)[1] in extension_list
and (os.path.split(filename)[1] not in exclude_file_list
or os.path.splitext(os.path.split(filename)[1])[0]
not in exclude_file_list))
else:
raise ValueError("Both an exclude list and include list were provided."
"Please clarify by using either or None. Currently, "
"include = %s, exclude = %s"
% (exclude_file_list, include_file_list))
return condition
def find_and_replace(filepath, new_filepath, string1, string2, verbose = False):
""" Search for a string1 inside a text file. Replace by string2 and write
into a new file whose filepath is returned.
"""
num_occurences = 0
if verbose:
print("Replacing '%s' by '%s' in %s ") % (string1,string2,filepath)
try:
f = open(filepath, "r")
except Exception as e:
raise IOError("Failed opening file with path %s with exception %s." %
(filepath, e))
content = f.read()
f.close()
num_occurences = content.count(string1)
if num_occurences:
new_content = content.replace(string1, string2)
if verbose:
print("*** Found %s occurences of %s in %s. ***" %
(num_occurences, string1, filepath))
with open(new_filepath, "w") as f:
f.write(new_content)
return num_occurences
################################################################################
# Main
################################################################################
def main(folder_path, string1, string2 = "", extension_list = [".py"],
exclude_file_list = [], include_file_list = None, safe = True,
postfix = "2", verbose = False):
""" Manages the search a replace behavior
"""
# Create a copy of the folder.
folder_path = os.path.abspath(folder_path)
containing_folder = os.path.split(folder_path)[1]
eligible_files = search_for_files(folder_path,
extension_list,
exclude_file_list = exclude_file_list,
include_file_list = include_file_list,
verbose = verbose)
if eligible_files:
occurences = np.empty(len(eligible_files), dtype = np.int)
# Create the whole directory structure. The eligible files will be
# overwritten later on
if safe:
target_folder = folder_path.replace(containing_folder,
containing_folder+postfix)
if os.path.exists(target_folder):
raise IOError("Target folder %s already exists. Aborting..." %
target_folder)
shutil.copytree(folder_path,target_folder)
for index, filename in enumerate(eligible_files):
if safe:
target_filename = filename.replace(folder_path,
target_folder)
if not os.path.exists(os.path.dirname(target_filename)):
raise RuntimeError("The target filename %s doesn't exist but "
"should. Investigate..." % target_filename)
elif target_filename == filename:
raise RuntimeError("The target filepath %s should be different from "
"the original filepath %s. Investigate..."
% (target_filename, filename))
else:
target_filename = filename
occurences[index] = find_and_replace(filename, target_filename, string1,
string2, verbose = verbose)
if occurences.max() == 0:
print "No occurence of the string requested was found."
return
################################################################################
# Formatting of inputs
################################################################################
def parse_string_list(string):
""" Converts a list in the form of a string to a list of strings. If the
argument given is not a list looking object ("[ something ]"), there is
only 1 element in the list so create a list with it.
"""
my_list = []
if string.startswith("[") and string.endswith("]"):
string = string.replace("[","")
string = string.replace("]","")
my_list = string.split(",")
if my_list == [""]:
my_list = []
else:
my_list = [string]
return my_list
def parse_extension_list(ext_list):
""" Make sure the list of extensions has the right format: each extension
must start with a dot. If it doesn't, add it. If the extension is 4
char or more, issue a warning.
"""
output = []
for ext in ext_list:
if len(ext) >= 4:
warnings.warn("The extension %s has more than 4 characters: was "
"that a typo?")
if ext.startswith("."):
output.append(ext)
else:
output.append("."+ext)
return output
################################################################################
# Interface
################################################################################
if __name__ == "__main__":
import sys
DEFAULT_VERBOSE = True
DEFAULT_SAFE = True
if len(sys.argv) < 3:
raise OSError("3 arguments must be provided to the multi-search-replace"
" utility. \nUsage:\n python multi_search_replace.py "
"folder_path string1 [string2 [safe [postfix "
"[extension_list [exclude_file_list [include_file_list "
"[verbose]]]]]]]")
else:
folder_path = sys.argv[1]
string1 = sys.argv[2]
if len(sys.argv) >= 4:
string2 = sys.argv[3]
if len(sys.argv) >= 5:
safe = eval(sys.argv[4])
if len(sys.argv) >= 6:
postfix = sys.argv[5]
if len(sys.argv) >= 7:
extension_list = parse_extension_list(
parse_string_list(sys.argv[6]))
if len(sys.argv) >= 8:
exclude_file_list = parse_string_list(sys.argv[7])
if len(sys.argv) >= 9:
include_file_list = parse_string_list(
sys.argv[8])
if len(sys.argv) >= 10:
verbose = bool(sys.argv[9])
else:
verbose = DEFAULT_VERBOSE
else:
verbose = DEFAULT_VERBOSE
include_file_list = []
else:
verbose = DEFAULT_VERBOSE
include_file_list = []
exclude_file_list = []
else:
verbose = DEFAULT_VERBOSE
include_file_list = []
exclude_file_list = []
extension_list = [".py"]
else:
verbose = DEFAULT_VERBOSE
include_file_list = []
exclude_file_list = []
extension_list = [".py"]
postfix = "2"
else:
verbose = DEFAULT_VERBOSE
include_file_list = []
exclude_file_list = []
extension_list = [".py"]
postfix = "2"
safe = DEFAULT_SAFE
else:
verbose = DEFAULT_VERBOSE
include_file_list = []
exclude_file_list = []
extension_list = [".py"]
postfix = "2"
safe = DEFAULT_SAFE
string2 = ""
main(folder_path = folder_path, string1 = string1, string2 = string2,
safe = safe, extension_list = extension_list, exclude_file_list =
exclude_file_list, include_file_list = include_file_list,
verbose = verbose)