1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
|
#!/usr/bin/python
#
# Copyright (C) 2009 - Curtis Hovey <sinzui.is at verizon.net>
# This software is licensed under the GNU General Public License version 2.
#
# It comes from the Gedit Developer Plugins project (launchpad.net/gdp); see
# http://bazaar.launchpad.net/~sinzui/gdp/trunk/files/head%3A/plugins/gdp/ &
# http://bazaar.launchpad.net/%7Esinzui/gdp/trunk/annotate/head%3A/COPYING.
"""Find in files and replace strings in many files."""
import mimetypes
from optparse import OptionParser
import os
import re
import sys
mimetypes.init()
def extract_match(file_path, match_re, substitution=None):
"""Return a summary of matches in a file."""
lines = []
content = []
match = None
file_ = open(file_path, 'r')
try:
for lineno, line in enumerate(file_):
match = match_re.search(line)
if match:
lines.append(
{'lineno': lineno + 1, 'text': line.strip(),
'match': match})
if substitution is not None:
line = match_re.sub(substitution, line)
if substitution is not None:
content.append(line)
finally:
file_.close()
if lines:
if substitution is not None:
file_ = open(file_path, 'w')
try:
file_.write(''.join(content))
finally:
file_.close()
return {'file_path': file_path, 'lines': lines}
return None
def find_matches(root_dir, file_pattern, match_pattern,
substitution=None, extract_match=extract_match):
"""Iterate a summary of matching lines in a file."""
match_re = re.compile(match_pattern)
for file_path in find_files(root_dir, file_pattern=file_pattern):
summary = extract_match(
file_path, match_re, substitution=substitution)
if summary:
yield summary
def find_files(root_dir, skip_dir_pattern='^[.]', file_pattern='.*'):
"""Iterate the matching files below a directory."""
skip_dir_re = re.compile(r'^.*%s' % skip_dir_pattern)
file_re = re.compile(r'^.*%s' % file_pattern)
for path, subdirs, files in os.walk(root_dir):
subdirs[:] = [dir_ for dir_ in subdirs
if skip_dir_re.match(dir_) is None]
for file_ in files:
file_path = os.path.join(path, file_)
if os.path.islink(file_path):
continue
mime_type, encoding = mimetypes.guess_type(file_)
if mime_type is None or 'text/' in mime_type:
if file_re.match(file_path) is not None:
yield file_path
def get_option_parser():
"""Return the option parser for this program."""
usage = "usage: %prog [options] root_dir file_pattern match"
parser = OptionParser(usage=usage)
parser.add_option(
"-s", "--substitution", dest="substitution",
help="The substitution string (may contain \\[0-9] match groups).")
parser.set_defaults(substitution=None)
return parser
def main(argv=None):
"""Run the command line operations."""
if argv is None:
argv = sys.argv
parser = get_option_parser()
(options, args) = parser.parse_args(args=argv[1:])
root_dir = args[0]
file_pattern = args[1]
match_pattern = args[2]
substitution = options.substitution
print "Looking for [%s] in files like %s under %s:" % (
match_pattern, file_pattern, root_dir)
for summary in find_matches(
root_dir, file_pattern, match_pattern, substitution=substitution):
print "\n%(file_path)s" % summary
for line in summary['lines']:
print " %(lineno)4s: %(text)s" % line
if __name__ == '__main__':
sys.exit(main())
|