-
Notifications
You must be signed in to change notification settings - Fork 11
/
preplace
executable file
·194 lines (175 loc) · 5.62 KB
/
preplace
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
#!/usr/bin/env perl
# preplace: timestamp-preserving regular expression replacement.
# See usage() immediately below for usage information.
sub usage () {
print STDERR <<END_OF_USAGE;
preplace: timestamp-preserving Perl-style regular expression replacement.
Invoke like:
preplace [options] oldregex newreplacement [files]
If the files are omitted, all files under the current directory are used.
If a given file is a directory, then all files under it are used.
Args are:
-name regex only consider files whose names match the Perl regex;
applicable only if a list of files was not explicitly given
-i.bak back up each file with extension ".bak"
-preserve preserve the old timestamp even if replacement occurs
-- end of command-line options; regexes follow (optional);
use this if OLDREGEX starts with a hyphen
-help print this message
-debug print debugging output
This is like
perl -pi -e 's/OLD/NEW/g'
except that it applies to all files recursively and the timestamp on each file
is updated only if the replacement is performed. If the replacement is not
performed (because the old regular expression did not match in the file), then
the timestamp is unmodified. Thus, you can call it on as many files as you like
without losing the historical information about when a file was last modified.
END_OF_USAGE
}
# Called from the shell, it could be emulated as:
# find . -type f -name '*.html' -print \
# | xargs grep -l -P 'OLD' \
# | xargs perl -pi.bak -e 's|OLD|NEW|g'
# or as (with sed, not Perl, regular expression syntax):
# sed -i.bak 's/oldText/newText/g' `grep -ril 'oldText'`
# Problem: it only works for replacements on a single line; the OLD text
# cannot span lines (though the NEW text can).
use strict;
use English;
$WARNING = 1;
use Cwd 'abs_path';
use File::Find;
# use "-debug" switch to set
my $debug = 0;
my $fileregex;
my $backupsuffix = "";
my $preservedate = 0;
my $fromregex;
my $toregex;
my @filelist;
my $shortprogname = $0;
$shortprogname =~ s|.*/||;
my $forhelp = "for help, run: $shortprogname -help";
while ((scalar(@ARGV) > 0) && ($ARGV[0] =~ /^-/)) {
my $arg = shift @ARGV;
if ($arg =~ /^-i/) {
$backupsuffix = substr($arg, 2);
} elsif ($arg eq "-name") {
if (scalar(@ARGV) == 0) {
die "'-name' option requires an argument; $forhelp\n";
}
$fileregex = (shift @ARGV);
} elsif ($arg eq "-preserve") {
$preservedate = 1;
} elsif ($arg eq "--") {
last;
} elsif ($arg eq "-help") {
usage();
exit();
} elsif ($arg eq "-debug") {
$debug = 1;
} else {
die "preplace: unrecognized argument '$arg'; if OLDREGEX starts with a hyphen, precede it by '--'; $forhelp\n";
}
}
if (scalar(@ARGV) < 2) {
die "Not enough arguments (at least 2 required).\n$forhelp\n";
}
$fromregex = shift @ARGV;
$toregex = shift @ARGV;
if ($debug) {
print STDERR "fromregex = $fromregex\n";
print STDERR "toregex = $toregex\n";
}
# Subroutine to set @filelist. It's a callback; File::Find ignores its
# return value.
sub collect {
my $fullname = $File::Find::name;
if ($debug) {
print STDERR "collect considering $fullname\n";
# my $result = (-f $fullname);
# if (!defined($result)) { $result = 0; }
# print STDERR "-f $fullname = $result\n";
}
# Never consider version control directories.
# (This needs to be documented and customizable.)
if ((-d $fullname)
&& ($_ =~ /^(\.bzr|CVS|\.git|\.hg|\.svn)$/)) {
$File::Find::prune = 1;
}
if ((-f $fullname)
&& ((! defined($fileregex)) || ($fullname =~ /$fileregex/o))) {
if ($debug) {
print STDERR "collected $fullname\n";
}
push(@filelist, $fullname);
}
}
if (scalar(@ARGV) == 0) {
push @ARGV, ".";
}
# Must pass an absolute filename, not ".", to collect(), because flags like "-e"
# and "-f" fail if a filename starts with "./" and contains any other "/".
my $pwd = `pwd`;
chomp($pwd);
@filelist = ();
for my $arg (@ARGV) {
if ($arg eq ".") { $arg = $pwd; }
$arg =~ s|^\./|$pwd/|;
# Occurrences of abs_path() are because -f doesn't work on relative paths.
if (-d $arg) {
find(\&collect, abs_path($arg));
} elsif (-f abs_path($arg)) {
push @filelist, abs_path($arg);
} else {
print STDERR "argument $arg is neither a file nor a directory\n";
}
}
if ($debug) {
print STDERR "filelist: @filelist\n";
}
foreach my $file (@filelist) {
if ($debug) {
print STDERR "file: <<$file>>\n";
}
if (! open(SEARCH, $file)) {
print STDERR "Can't open file $file for read: $!\n";
next;
}
my $match = 0;
my $line;
while (defined($line = <SEARCH>)) {
if ($line =~ /$fromregex/o) {
$match = 1;
last;
}
}
close(SEARCH);
if ($match) {
# Should rewrite in perl rather than invoking external command, I suppose.
my $delimiter;
my $fromtoregex = $fromregex . $toregex;
if ($fromtoregex !~ m|/|) {
$delimiter = "/";
} elsif ($fromtoregex !~ m/\|/) {
$delimiter = "|";
} elsif ($fromtoregex !~ m/:/) {
$delimiter = ":";
} elsif ($fromtoregex !~ m/#/) {
$delimiter = "#";
} else {
die "Cannot choose delimiter; regexes use too many special characters";
}
# Quote $file in case it contains whitespace.
# Unfortunately, if the from or to regex contains a single quote, then the command is mangled.
my $command = "perl -pi$backupsuffix -e 'use strict; s$delimiter$fromregex$delimiter$toregex${delimiter}g' '$file'";
if ($debug) {
print STDERR "command: $command\n";
}
my ($atime, $mtime) = (stat($file))[8,9];
system($command);
if ($preservedate) {
utime $atime, $mtime, $file;
}
}
}