-
Notifications
You must be signed in to change notification settings - Fork 244
/
Copy pathbatchGitVersion.pm
331 lines (305 loc) · 11.8 KB
/
batchGitVersion.pm
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
#!/usr/bin/env perl
# Copyright (c) MediaTek USA Inc., 2023
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or (at
# your option) any later version.
#
# This program is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, see
# <http://www.gnu.org/licenses/>.
#
# This implementation creates an initial database to hold the version stamps
# for all files in the repo - then simply queries that DB during
# execution. See 'usage' for details:#
# .../batchGitVersion.pm --help
#
# This is a sample script which uses git commands to determine
# the version of the filename parameter.
# Version information (if present) is used during ".info" file merging
# to verify that the data the user is attempting to merge is for the same
# source code/same version.
# If the version is not the same - then line numbers, etc. may be different
# and some very strange errors may occur.
package batchGitVersion;
use strict;
use Getopt::Long qw(GetOptionsFromArray);
use File::Spec;
use File::Basename qw(dirname basename);
use Cwd qw/getcwd/;
use FindBin;
use lib "$FindBin::RealBin";
use annotateutil qw(get_modify_time not_in_repo compute_md5 call_get_version);
our @ISA = qw(Exporter);
our @EXPORT_OK = qw(new extract_version compare_version usage);
# should probably use "BLOB" as the token - so anyone we call can know that this
# is a blob sha - and can look up the file sha, if desired
my $shaToken = 'BLOB';
sub usage
{
my ($script, $help) = @_;
$script = $0 unless defined $script;
my $exe = basename $script;
print(STDERR<<EOF);
usage: $exe->new([--md5] [--allow-missing [--repo repo] \\
[--prepend path] [--prefix dir]* \\
[--token string] \\
[-v | --verbose]*)
$exe->extract_version(pathname)
$exe->compare(old_version, new_version, pathname)
EOF
if ($help) {
print(STDERR<<EOF);
The 'new' callback queries the git repo specified by 'repo'
(or \$CWD, if --repo is not supplied) and holds the data.
\$ $exe->new(...) # to initialize git_data
--md5 : return MD5 signature if pathname not found in repo
--allow-missing: if set: return empty string if pathname not found
otherwise: die (fatal error)
--repo dir : where to find the git repo
--prepend path : prepend path to names found in repo before storing
e.g., if path is 'x/y' and object 'dir/file' is found
in the repo, then 'x/y/dir/file' is stored.
--prefix dir : add dir to the list of directories to search, to find
pathname.
--token string : use string as the blob sha token in the version string.
default value is 'BLOB' - so application can
distinguish between SHA types - say, to complare
to compare a BLOB SHA to a file SHA.
For backward compatibility with earlier versions of
this script, use '--token SHA'.
-v | --verbose : increase verbosity
Setting the verbosity flag causes the script to print some (hopefully useful)
debug information - so you can see why your use is not working the way you
might have expected.
The second call queries DB to find 'pathname'.
- 'pathname' may be be a file name which is found in the git repo, but
with some prefix prepended. For example:
pathname: /build/directory/path/repo/dir/file
filename: repo/dir/file
- if script is called as
\$ $exe --prefix /build/directory/path my_git_data \
/build/directory/path/repo/dir/file
$shaToken git_sha_string
- zero or more --prefix arguments can be specified.
$exe will look at each, in the order specified.
- if pathname is not found in the DB:
- if pathname does not resolve to a file:
- '' (empty string) if '--allow-missing' flag used,
- else, error
- if '--md5' is passed: return MD5 checksum of the file
- else return file creation timestamp
NOTE: $exe DOES NOT CHECK FOR LOCAL CHANGES that are not checked in
to your git repo - so versions will compare as identical even
if the local file has been edited.
Please commit your changes before running $exe.
The third call passes two version strings which are expected to be the same.
Under normal circumstances, the version strings will have been returned by
some call(s) to $exe.
Exit status is 0 when files match, 1 otherwise.
To diagnose version mismatches using these SHAs:
- You can git diff them to see how they are different the same way you
'git diff' commit shas (except you do not to specify a file)
- You can 'git log commit1..commit2' because you should also store
the overall sha of these two points (again if the scripting just
wants to know the delta).
Again note: the normal git way of asking these types of questions is to
just store a single commit shas, unlike perforce/svn that exactly
represents the current files, 'git diff --name-status' can VERY quickly
tell you what has changed.
There is also a mechanism for determining which commits contain which
blobs given a file and a starting point. Again it is just easier
to use 'git log commit1..commit2'
EOF
} else {
print(STDERR "\n see '$exe --help' for more information\n");
}
}
use constant {
DB => 0,
PREFIX => 1,
MD5 => 2,
MISSING => 3,
VERBOSE => 4,
};
sub new
{
my $class = shift;
my $script = shift;
my $stand_alone = $0 eq $script;
# script should be me...
my $use_md5;
my $allow_missing;
my $repo;
my $prepend;
my @prefix;
my $help;
my $verbose = 0;
if (!GetOptionsFromArray(\@_,
("md5" => \$use_md5,
'prefix:s' => \@prefix,
'repo:s' => \$repo,
'allow-missing' => \$allow_missing,
'prepend:s' => \$prepend,
"verbose|v+" => \$verbose,
'token:s' => \$shaToken,
'help' => \$help,)) ||
($stand_alone && 0 != scalar(@_)) ||
$help
) {
usage($script, $help);
exit(defined($help) && 0 == scalar(@_) ? 0 : 1) if $stand_alone;
return undef;
}
my %db;
my $cd = $repo ? "cd $repo ;" : '';
open(GIT, '-|', "$cd git ls-tree -r --full-tree HEAD") or
die("unable to execute git: $!");
my @prepend;
if ($prepend) {
push(@prepend, $prepend);
}
my $errLeader = "unexpected git ls-tree entry:\n ";
my %submodule;
while (<GIT>) {
if (/^\d+\s+blob\s+(\S+)\s+(.+)$/) {
# line format: mode blob sha path
$db{File::Spec->catfile(@prepend, $2)} = $1;
} elsif (/^\d+\s+commit\s+(\S+)\s+(\S+)$/) {
# line format: mode commit sha path
die("duplicate submodule etnry for $2") if exists($submodule{$2});
$submodule{$2} = $1;
} else {
print(STDERR "$errLeader$_");
$errLeader = ' ';
}
}
close(GIT) or die("error on close $repo pipe: $!");
# now look for submodules
open(GIT, '-|',
"$cd git submodule foreach 'git ls-tree -r --full-tree HEAD ; echo done'")
or
die("unable to execute git: $!");
my $current;
my @stack;
my $number = 2;
my $countdown = $number * $verbose;
my $prefix = '';
while (<GIT>) {
if (/^\d+\s+blob\s+(\S+)\s+(.+)$/) {
# line format: mode blob sha path
die("unknown current submodule") unless defined($current);
$db{File::Spec->catfile(@prepend, $current, $2)} = $1;
if ($countdown) {
--$countdown;
print("${prefix}storing " .
File::Spec->catfile(@prepend, $current, $2) .
" => $1\n");
print("$prefix ...\n") unless $countdown;
}
} elsif (/^\d+\s+commit(\S+)\s+(\s+)$/) {
# line format: mode commit sha path
my $s = File::Spec->catfile(@prepend, $current, $2);
die("duplicate submodule etnry for $s") if exists($submodule{$s});
$submodule{$s} = $1;
} elsif (/^Entering '([^']+)'$/) {
$current = File::Spec->catfile(@stack, $1);
push(@stack, $1);
die("found unexpected submodule '$current'")
unless exists($submodule{$current});
$countdown = $number * $verbose;
if ($countdown) {
print("${prefix}enter submodule $current\n");
$prefix .= ' ';
}
} elsif (/^done$/) {
die("empty stack") unless @stack;
pop(@stack);
if (@stack) {
$current = File::Spec->catfile(@stack);
} else {
$current = undef;
}
if ($verbose) {
print("${prefix}exit submodule $current\n");
$prefix = substr($prefix, 2);
}
} else {
print(STDERR "$errLeader$_");
$errLeader = ' ';
}
}
close(GIT) or die("error on close submodule pipe: $!");
$repo = getcwd() unless $repo;
push(@prefix, $repo) unless grep(/^$repo/, @prefix);
# @todo enhancement: could look for local edits and store
# them into the DB here
foreach my $p (@prefix) {
# want all the prefixes to end with dir separator so we can
# just concat them
$p .= '/' unless substr($p, -1) eq '/';
}
my $self = [\%db, \@prefix, $use_md5, $allow_missing, $verbose];
return bless $self, $class;
}
sub extract_version
{
my ($self, $file) = @_;
my $db = $self->[DB];
my $prefix = $self->[PREFIX];
my $verbose = $self->[VERBOSE];
print("extract_version($file)\n") if $verbose;
if (@$prefix) {
# check we we can strip the prefix off the filename - to find it in the DB
foreach my $p (@$prefix) {
print(" check prefix $p ..\n") if $verbose;
if (0 == index($file, $p)) {
print(" .. match\n") if $verbose;
my $tail = substr($file, length($p));
if (exists($db->{$tail})) {
print(" .. found\n") if $verbose;
return $shaToken . ' ' . $db->{$tail};
}
}
}
}
if (exists($db->{$file})) {
print(" .. found\n") if $verbose;
return $shaToken . ' ' . $db->{$file};
}
unless (-e $file) {
if ($self->[MISSING]) {
return ''; # empty string
}
die("Error: $file does not exist - perhaps you need the '--allow-missing' flag"
);
}
my $version = get_modify_time($file);
$version .= ' md5:' . compute_md5($file)
if ($self->[MD5]);
return $version;
}
sub compare_version
{
my ($self, $new, $old, $file) = @_;
if ($self->[MD5] &&
$old !~ /^$shaToken/ &&
$old =~ / md5:(.+)$/) {
my $o = $1;
if ($new =~ / md5:(.+)$/) {
return ($o ne $1);
}
# otherwise: 'new' was not an MD5 signature - so fall through to exact match
}
return ($old ne $new); # just look for exact match
}
unless (caller) {
call_get_version("batchGitVersion", $0, @ARGV);
}
1;