xref: /OK3568_Linux_fs/kernel/scripts/cleanpatch (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun#!/usr/bin/env perl
2*4882a593Smuzhiyun# SPDX-License-Identifier: GPL-2.0
3*4882a593Smuzhiyun#
4*4882a593Smuzhiyun# Clean a patch file -- or directory of patch files -- of stealth whitespace.
5*4882a593Smuzhiyun# WARNING: this can be a highly destructive operation.  Use with caution.
6*4882a593Smuzhiyun#
7*4882a593Smuzhiyun
8*4882a593Smuzhiyunuse warnings;
9*4882a593Smuzhiyunuse bytes;
10*4882a593Smuzhiyunuse File::Basename;
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun# Default options: widest visual width an added line may have before a warning is printed.  Overridden by -width/-w; 0 turns the check off.
13*4882a593Smuzhiyun$max_width = 79;
14*4882a593Smuzhiyun
# Normalize every run of spaces that is immediately followed by a tab.
# The spaces are dropped, or folded into additional tabs, so that the text
# after the tab stays at the same visual column (tab stops every 8 columns).
# Spaces that are not followed by a tab are emitted unchanged.
#
# Takes the text to clean and returns the cleaned copy.
sub clean_space_tabs($)
{
    no bytes;			# Tab alignment depends on characters

    my ($input) = @_;
    my $output  = '';
    my $column  = 0;		# Visual column of the text emitted so far
    my $pending = 0;		# Spaces read but not yet emitted

    foreach my $ch (split(//, $input)) {
        if ($ch eq ' ') {
            # Hold the space back until we know whether a tab follows.
            $pending++;
            next;
        }

        if ($ch eq "\t") {
            # Find the tab stop the original spaces+tab reached and emit
            # just enough tabs to get there; the held spaces are dropped.
            my $target = ($column + $pending + 8) & ~7;
            $output .= "\t" x (($target >> 3) - ($column >> 3));
            $column  = $target;
            $pending = 0;
            next;
        }

        # Anything else: the held spaces are real, so flush them first.
        # A line terminator restarts the column count.
        $output .= (' ' x $pending) . $ch;
        $column  = ($ch eq "\n" || $ch eq "\r") ? 0 : $column + $pending + 1;
        $pending = 0;
    }

    # Spaces at the very end of the input were never followed by a tab.
    return $output . (' ' x $pending);
}
54*4882a593Smuzhiyun
# Compute the visual width of a string: the widest of its newline-separated
# rows, with each tab advancing to the next multiple of 8 columns and every
# other character counting as one column.
#
# Takes the string to measure and returns the width as a number.
sub strwidth($) {
    no bytes;			# Tab alignment depends on characters

    my ($str) = @_;
    my $widest = 0;

    # A limit of -1 keeps trailing empty rows; they simply measure 0.
    foreach my $row (split(/\n/, $str, -1)) {
        my $col = 0;
        foreach my $ch (split(//, $row)) {
            $col = ($ch eq "\t") ? (($col + 8) & ~7) : $col + 1;
        }
        $widest = $col if ($col > $widest);
    }

    return $widest;
}
79*4882a593Smuzhiyun
# Program name, used as the prefix of diagnostics.
$name = basename($0);

# Files to process, in command-line order.
@files = ();

# Parse the command line.  Anything starting with '-' is an option and may
# be mixed freely with file names.  The only option is -width (or -w), which
# takes a non-negative integer operand and replaces $max_width.
while (defined(my $arg = shift(@ARGV))) {
    if ($arg !~ /^-/) {
        push(@files, $arg);
        next;
    }

    # Only -width/-w consume an operand; for any other option $width stays
    # undefined and we fall into the usage error below.
    my $width;
    $width = shift(@ARGV) if ($arg eq '-width' || $arg eq '-w');

    # Reject unknown options, a -width with nothing after it, and operands
    # that are not plain non-negative integers.  Previously a missing or
    # non-numeric operand silently became 0, which disables the check.
    if (!defined($width) || $width !~ /\A[0-9]+\z/) {
        print STDERR "Usage: $name [-width #] files...\n";
        exit 1;
    }

    $max_width = $width + 0;
}
96*4882a593Smuzhiyun
# Unified-diff hunk header: "@@ -start[,count] +start[,count] @@tail".
# Captures: $1 old start, $2 old count, $3 new start, $4 new count, $5 the
# text after the closing "@@" (without the final newline).  A count may be
# omitted by diff when it is 1, in which case its capture is undefined.
my $hunk_header_re =
    qr/^\@\@\s+\-([0-9]+)(?:,([0-9]+))?\s+\+([0-9]+)(?:,([0-9]+))?\s\@\@(.*)$/;

# Clean each patch file in place.  For every hunk, added ('+') lines have
# trailing whitespace removed and space-before-tab sequences normalized,
# blank added lines at the end of the hunk are dropped (and the hunk header
# count adjusted to match), and over-wide added lines are reported.  Lines
# outside hunks are copied through untouched.  The file is rewritten only
# if the total byte count changed and no error was found.
foreach my $f (@files) {
    print STDERR "$name: $f\n";

    if (! -f $f) {
        print STDERR "$f: not a file\n";
        next;
    }

    my $fh;
    if (!open($fh, '+<', $f)) {
        print STDERR "$name: Cannot open file: $f: $!\n";
        next;
    }

    binmode $fh;

    # First, verify that it is not a binary file; consider any file
    # with a zero byte to be a binary file.
    my $is_binary = 0;
    my $data;
    while (read($fh, $data, 65536)) {
        if ($data =~ /\0/) {
            $is_binary = 1;
            last;
        }
    }
    undef $data;

    if ($is_binary) {
        print STDERR "$name: $f: binary file\n";
        close($fh);		# Don't leave the handle open when skipping
        next;
    }

    seek($fh, 0, 0);

    my $in_bytes  = 0;		# Bytes read from the file
    my $out_bytes = 0;		# Bytes queued for output
    my $lineno    = 0;

    my @lines      = ();	# Output, one element per line
    my @hunk_lines = ();	# Current hunk: header first, then its body
    my $minus_lines = 0;	# Old-side lines still expected in this hunk
    my $plus_lines  = 0;	# New-side lines still expected in this hunk

    my $in_hunk = 0;
    my $err = 0;

    LINE: while (defined(my $line = <$fh>)) {
        $lineno++;
        $in_bytes += length($line);

        if (!$in_hunk) {
            if ($line =~ $hunk_header_re) {
                # An omitted count means exactly one line.
                $minus_lines = defined($2) ? $2 + 0 : 1;
                $plus_lines  = defined($4) ? $4 + 0 : 1;
                if ($minus_lines || $plus_lines) {
                    $in_hunk = 1;
                    @hunk_lines = ($line);
                    next LINE;
                }
                # A header announcing an empty hunk has no body to
                # collect; fall through and copy it like any other line
                # so that it is not lost from the output.
            }
            push(@lines, $line);
            $out_bytes += length($line);
            next LINE;
        }

        # We're in a hunk

        if ($line =~ /^\+/) {
            $plus_lines--;

            my $text = substr($line, 1);
            $text =~ s/[ \t\r]*$//;		# Remove trailing spaces
            $text = clean_space_tabs($text);

            my $l_width = strwidth($text);
            if ($max_width && $l_width > $max_width) {
                print STDERR
                    "$f:$lineno: adds line exceeds $max_width ",
                    "characters ($l_width)\n";
            }

            push(@hunk_lines, '+'.$text);
        } elsif ($line =~ /^\-/) {
            $minus_lines--;
            push(@hunk_lines, $line);
        } elsif ($line =~ /^ /) {
            # Context lines count against both sides.
            $plus_lines--;
            $minus_lines--;
            push(@hunk_lines, $line);
        } elsif ($line =~ /^\\/) {
            # "\ No newline at end of file" marker: it belongs to the
            # hunk but counts against neither side.
            push(@hunk_lines, $line);
            next LINE;
        } else {
            print STDERR "$name: $f: malformed patch\n";
            $err = 1;
            last LINE;
        }

        if ($plus_lines < 0 || $minus_lines < 0) {
            print STDERR "$name: $f: malformed patch\n";
            $err = 1;
            last LINE;
        }
        next LINE if ($plus_lines || $minus_lines);	# Hunk continues

        # End of a hunk.  Walk the body backwards, dropping blank added
        # lines until the first context or added line that is kept.
        my @kept = ();
        my $adj = 0;		# Number of added lines dropped
        my $done = 0;

        for (my $i = $#hunk_lines; $i > 0; $i--) {
            my $hl = $hunk_lines[$i];
            if (!$done && $hl eq "+\n") {
                $adj++;		# Skip this line
                next;
            }
            $done = 1 if ($hl =~ /^[ +]/);
            unshift(@kept, $hl);
        }

        my $header = $hunk_lines[0];
        @hunk_lines = ();	# Free memory

        if ($adj) {
            # Rewrite the header so the new-side count matches the body.
            $header =~ $hunk_header_re
                or die "$name: $f: cannot re-parse hunk header\n";
            my $mstart = $1;
            my $mlin   = defined($2) ? $2 : 1;
            my $pstart = $3;
            my $plin   = defined($4) ? $4 : 1;
            my $tail   = $5;	# doesn't include the final newline

            $header = sprintf("@@ -%d,%d +%d,%d @@%s\n",
                              $mstart, $mlin, $pstart, $plin-$adj,
                              $tail);
        }

        # Transfer to the output array
        foreach my $out ($header, @kept) {
            $out_bytes += length($out);
            push(@lines, $out);
        }

        $in_hunk = 0;
    }

    # The file ended in the middle of a hunk.  Skip this when the loop
    # already reported an error, so the message is not printed twice.
    if ($in_hunk && !$err) {
        print STDERR "$name: $f: malformed patch\n";
        $err = 1;
    }

    if (!$err && $in_bytes != $out_bytes) {
        # Only write to the file if changed
        seek($fh, 0, 0);
        print $fh @lines
            or die "$name: Failed to write modified file: $f: $!\n";

        # tell() reports failure as -1 rather than undef.
        my $where = tell($fh);
        if (!defined($where) || $where < 0 || !truncate($fh, $where)) {
            die "$name: Failed to truncate modified file: $f: $!\n";
        }
    }

    close($fh);
}
261