]>
Commit | Line | Data |
---|---|---|
7ebf9245 MM |
1 | #!/usr/bin/perl -w |
2 | # | |
3 | ||
# --- static configuration ---------------------------------------------------

# Address that receives every report (the requester is Cc'ed by send_email).
$commits_list = "pld-cvs-commit\@pld-linux.org";

# Local directories, relative to the directory the script is started from.
$spool_dir  = "./spool";
$no_url_dir = "./upload";

# Remote layout: $copy_dir is relative to ftp root.
$copy_dir  = "src";
$df_server = "distfiles.pld-linux.org";
$df_scp    = "plddist\@$df_server:ftp";

# --- per-run state, filled in while the request is processed -----------------

# Parsed request: list of md5 sums and the md5 -> url map.
@md5 = ();
%url = ();

# Report text collected for the e-mail.
$problems   = "";
$normal_out = "";
@files      = ();

# Who asked, and which spool file is being handled.
$requester = "";
$req_login = "nobody";
$file      = "";

# Counters / flags that decide whether a mail gets sent at all.
$fetched_count = 0;
$force_reply   = 0;
7ebf9245 MM |
22 | |
23 | # try to look up some file in the spool; exit if none can be found | |
sub find_file_in_spool()
{
    # Stores the path of the first regular file readdir() yields from
    # $spool_dir in the global $file.  Dies if the directory cannot be
    # opened; exits with status 0 when no regular file was found.
    opendir(DIR, $spool_dir) || die "can't opendir $spool_dir: $!";
    while (defined(my $entry = readdir(DIR))) {
        my $candidate = "$spool_dir/$entry";
        if (-f $candidate) {
            $file = $candidate;
            last;
        }
    }
    closedir(DIR);

    # Nothing queued: leave quietly.
    exit 0 if ($file eq "");
}
38 | ||
39 | # read the file from the spool and try to unlink it; if it cannot be unlinked -- exit | |
40 | # sets $requester (email), $problems, @md5 (array of md5s) | |
41 | # and %url (map from md5 to url) | |
sub read_spool_file()
{
    # Parses the spool file named by the global $file.
    #
    # File layout, as read below:
    #   line 1    requester e-mail address
    #   line 2    flags ("force-reply" is the only one looked at)
    #   line 3..  either "ERROR: <text>" or "<32 hex md5> <url>"
    #
    # Sets $requester, $req_login, $force_reply, $problems, @md5 and %url.
    # Dies on malformed content; exits 0 when the file cannot be opened or
    # cannot be unlinked afterwards.
    open(my $spool, '<', $file) || exit 0;

    $requester = <$spool>;
    defined $requester or die "$file: empty spool file";
    chomp $requester;
    $requester =~ /^[a-zA-Z_\-0-9\@\.]+$/
        or die "$file: evil requester: $requester";
    $req_login = "";
    $requester =~ /^([^@]+)\@/ and $req_login = $1;
    $req_login =~ /^[a-z0-9A-Z_]+$/ or die "$file: evil requester $requester";

    # The flags line may be missing when the file has only one line.
    my $flags = <$spool>;
    $flags = "" unless defined $flags;
    $force_reply++ if ($flags =~ /force-reply/);

    while (my $line = <$spool>) {
        if ($line =~ /^ERROR/) {
            $line =~ s/^ERROR: //;
            $problems .= $line;
            next;
        }
        my ($sum, $link) = $line =~ /^([a-f0-9]{32})\s+((?:ftp|http|no-url|no-url-copy):\/\/(?:[=\@\?a-z0-9A-Z:\+\~\.\-\/_]|\%[0-9])+)\s*$/
            or die "$file: corrupted";
        # Test the captured URL rather than the raw line: the pattern above
        # tolerates trailing whitespace, which would hide a final "/".
        $link =~ m{/$} and die "$file: cannot fetch dir";
        push @md5, $sum;
        $url{$sum} = $link;
    }
    close($spool);

    unlink($file) || exit 0;
}
71 | ||
44cd280f MM |
# Strip the leading directory part of a path or URL: everything up to and
# including the last "/" is removed.  A string without "/" is returned as is.
sub basename($)
{
    my ($path) = @_;
    (my $leaf = $path) =~ s{.*/}{};
    return $leaf;
}
78 | ||
# Build the by-md5 path for a file:
#   /by-md5/<1st md5 char>/<2nd md5 char>/<md5>/<basename of url>
sub by_md5($$)
{
    my ($md5, $url) = @_;
    $md5 =~ /^(.)(.)/;
    my ($first, $second) = ($1, $2);
    return join("/", "", "by-md5", $first, $second, $md5, basename($url));
}
85 | ||
# Ask $df_server (through lftp) for the size of the file's by-md5 path.
# Returns true when the reply starts with "213 ", false otherwise.
sub got_on_distfiles($$)
{
    my ($md5, $url) = @_;
    my $remote_path = by_md5($md5, $url);
    my $lftp_script = "debug 0; open $df_server; quote size $remote_path";
    my $reply = `lftp -c '$lftp_script'`;
    return $reply =~ /^213 /;
}
93 | ||
# Copy $from to "$df_scp/$to" with scp.  Any output scp produces (stdout or
# stderr) counts as a failure and is appended to $problems.
# Returns true on failure, false when scp stayed silent.
sub copy_to_df($$)
{
    my ($from, $to) = @_;
    my $cmd = "scp -r -B -q $from $df_scp/$to";

    open(E, "$cmd 2>&1 |") or die;
    my $oops = join("", <E>);
    close(E);

    my $failed = ($oops ne "");
    $problems .= "scp problems: $cmd:\n$oops\n" if ($failed);
    return $failed;
}
108 | ||
# Stage a verified file under "$tmp_dir/$md5/", write its ".desc" companion
# and push the whole directory to the distfiles server.
#   $md5         md5 sum of the file
#   $url         url the file was requested with
#   $local_copy  where the file currently lives
# On success a "STORED" entry is added to $normal_out and $fetched_count is
# incremented; failures are recorded in $problems.
sub move_file($$$)
{
    my ($md5, $url, $local_copy) = @_;

    my $name   = basename($url);
    my $staged = "$tmp_dir/$md5/$name";

    # Bring the file into the staging directory unless it is already there.
    unless ($local_copy eq $staged) {
        if (system("mv -f \"$local_copy\" \"$staged\"") != 0) {
            $problems .= "FATAL: cannot move $local_copy to $tmp_dir\n";
            return;
        }
    }

    # A missing .desc is reported but does not stop the upload.
    if (open(D, "> $staged.desc")) {
        print D "URL: $url\n",
                "Login: $req_login\n",
                "MD5: $md5\n",
                'Fetched-by: $Id$' . "\n",
                "Time: " . time . "\n";
        close(D);
    } else {
        $problems .= "ERROR: cannot write $name.desc\n";
    }

    # Drop "<md5>/<name>" from the by-md5 path: the staging directory itself
    # (named after the md5) is what gets copied into the remaining prefix.
    my $target = by_md5($md5, $url);
    $target =~ s|/[^/]+/[^/]+$||;
    if (copy_to_df("$tmp_dir/$md5/", $target) == 0) {
        $normal_out .= "STORED: $url\n"
                     . "\t$md5 " . basename($url) . "\n"
                     . "\tSize: " . (-s $staged) . " bytes\n";
        $fetched_count++;
    }
}
144 | ||
b5c674c5 MM |
# For no-url* requests only: write "<basename>.link" into $tmp_dir and copy
# it to "$copy_dir/" on the distfiles server.  The file holds the relative
# by-md5 path for no-url-copy urls and the word "REMOVE" for plain no-url.
sub make_src_symlink($$)
{
    my ($md5, $url) = @_;

    $url =~ /^no-url/ or return;

    my $link_name = basename($url) . ".link";
    my $link_path = "$tmp_dir/$link_name";

    if (open(S, "> $link_path")) {
        print S ($url =~ /^no-url-copy/ ? ".." . by_md5($md5, $url) : "REMOVE");
        close(S);
        copy_to_df($link_path, "$copy_dir/$link_name");
    } else {
        $problems .= "ERROR: cannot write $link_path\n";
    }
}
164 | ||
# Return the lowercase hex md5 digest of the named file, or "" when the file
# cannot be opened or read.
#
# Uses the core Digest::MD5 module instead of running md5sum through the
# shell, so the file name is never interpolated into a command line.
sub md5($)
{
    my $file = shift;

    require Digest::MD5;

    open(my $fh, '<', $file) or return "";
    binmode($fh);
    # addfile() croaks on read errors; map that to the "no digest" result.
    my $digest = eval { Digest::MD5->new->addfile($fh)->hexdigest };
    close($fh);

    return defined $digest ? $digest : "";
}
172 | ||
# Handle a no-url* request: the file is expected at
# "$no_url_dir/$req_login/<name>", where <name> is the part of the url right
# after "://".  A file with the right md5 is stored via move_file() and gets
# its .link file; anything else is reported in $problems.
sub handle_no_url($$)
{
    my ($md5, $url) = @_;

    my ($uploaded_name) = $url =~ m|://([^/]+)|
        or die "corrupted! (no-url)";
    my $upload = "$no_url_dir/$req_login/$uploaded_name";

    unless (-f $upload) {
        $problems .= "FATAL: $upload was not uploaded\n";
        return;
    }

    my $actual = md5($upload);
    if ($actual eq $md5) {
        move_file($md5, $url, $upload);
        make_src_symlink($md5, $url);
    } else {
        $problems .= "FATAL: $upload md5 mismatch, needed $md5, got $actual\n";
    }
}
193 | ||
7ebf9245 MM |
# Run one wget command line with stderr folded into stdout.
# Returns (\@lines, $complaints): every output line, plus the concatenation
# of the lines that do NOT match the "URL:... -> ..." pattern (presumably
# wget's normal -nv transfer report; anything else is treated as a problem).
sub _run_wget($)
{
    my $cmd = shift;
    my @lines = ();
    my $complaints = "";

    if (open(my $wget, "$cmd 2>&1 |")) {
        while (my $line = <$wget>) {
            push @lines, $line;
            next if ($line =~ /URL:.*\s+\-\>\s+.*/);
            $complaints .= $line;
        }
        close($wget);
    } else {
        $complaints = "cannot run wget: $!\n";
        push @lines, $complaints;
    }
    return (\@lines, $complaints);
}

# Fetch one requested file and store it on the distfiles server.
#   $md5  expected md5 sum of the file
#   $url  where to get it (ftp, http, or a no-url* pseudo url)
#
# Steps: skip files the server already has; hand no-url* requests to
# handle_no_url(); otherwise download with wget (retrying empty ftp results
# with --passive-ftp), verify the md5, reject http downloads of archives that
# "file" identifies as text/empty, and finally call move_file().
# Results go to $normal_out, failures to $problems; the basename is always
# appended to @files.
sub fetch_file($$)
{
    my ($md5, $url) = @_;
    my $all_out = "";
    my $bn = basename($url);
    my $local = "$tmp_dir/$md5/$bn";
    my $cmd = "wget -nv -O $local \"$url\"";
    my $cmd2 = "wget -nv --passive-ftp -O $local \"$url\"";

    push @files, $bn;

    if (got_on_distfiles($md5, $url)) {
        $normal_out .=
            "ALREADY GOT: $url\n" .
            "\t$md5 " . basename($url) . "\n";
        make_src_symlink($md5, $url);
        return;
    }

    # The directory may already exist when the same md5 was listed twice and
    # the earlier attempt failed; that must not abort the whole run.
    -d "$tmp_dir/$md5" or mkdir("$tmp_dir/$md5")
        or die "cannot create $tmp_dir/$md5: $!";

    if ($url =~ /^no-url/) {
        handle_no_url($md5, $url);
        return;
    }

    my ($lines, $out) = _run_wget($cmd);
    $all_out .= join("", @$lines);
    if ($out ne "") {
        $problems .= "$cmd:\n$out\n\n";
    }

    # An empty file from an ftp url: try once more in passive mode.
    if (-f $local && -s $local == 0 && $url =~ /^ftp:/) {
        ($lines, $out) = _run_wget($cmd2);
        $all_out .= join("", map { "\n\t\t$_" } @$lines);
        if ($out ne "") {
            # Report the command that actually produced this output.
            $problems .= "$cmd2:\n$out\n\n";
        }
    }

    if (-r $local && -s $local > 0) {
        my $computed_md5 = md5($local);
        if ($computed_md5 ne $md5) {
            $problems .= "FATAL: $url md5 mismatch, needed $md5, got $computed_md5\n";
        } else {
            # For http downloads of archive-looking names, ask "file" what
            # the content is, to catch text pages served in place of the file.
            my $testres = "";
            if ($url =~ /^http:/ && $local =~ /\.(tar\.(bz2|gz)|tgz|zip|jar|xpi)$/) {
                open(my $probe, "file \"$local\" |") or die;
                $testres = <$probe>;
                close($probe);
                $testres = "" unless defined $testres;
            }
            if ($testres =~ /empty|(ASCII|HTML|SGML).*text/) {
                $testres =~ s/.*://;
                $problems .= "FATAL: data returned from $url: $testres";
            } else {
                move_file($md5, $url, $local);
            }
        }
    } elsif (-f $local && -s $local > 0) {
        $problems .= "FATAL: $url ($md5) was not fetched ($cmd: $all_out): file is not readable\n";
    } else {
        $problems .= "FATAL: $url ($md5) was not fetched ($cmd: $all_out)\n";
    }
    # save space
    unlink($local);
}
271 | ||
# Process every md5 collected in @md5, in order, through fetch_file().
# Problems already recorded while reading the spool file are separated from
# the fetch problems by a blank gap.
sub fetch_files()
{
    if ($problems ne "") {
        $problems .= "\n\n";
    }
    for my $sum (@md5) {
        fetch_file($sum, $url{$sum});
    }
}
279 | ||
# Mail the report through "/usr/sbin/sendmail -t".
# The message goes From the requester, To $commits_list, Cc the requester;
# the subject lists at most ten file names (the rest collapsed into "...")
# and is prefixed with "ERRORS: " when $problems is not empty.
# Dies when the pipe to sendmail cannot be closed cleanly.
sub send_email()
{
    open(EMAIL, "| /usr/sbin/sendmail -t");
    #open(EMAIL, "| cat");

    my $marker = ($problems ne "") ? "ERRORS: " : "";

    # Display name for the From header: everything before the last "@".
    my $req_login;
    if ($requester =~ /^(.*)\@/) {
        $req_login = $1;
    }

    # Keep the subject short; note that this truncates the global @files.
    if (@files > 10) {
        splice(@files, 10, @files - 10, "...");
    }

    my $message = join("\n",
        "From: $req_login <$requester>",
        "To: $commits_list",
        "Cc: $requester",
        "Subject: DISTFILES: ${marker}@{files}",
        "Message-ID: <" . $$ . "." . time . "\@distfiles.pld-linux.org>",
        "X-distfiles-program: file-fetcher.pl",
        "X-distfiles-version: " . '$Id$',
        "",
        $problems,
        "Files fetched: $fetched_count",
        "",
        $normal_out,
        "",
        "--",
        "Virtually Yours: distfiles.",
        "");

    print EMAIL $message;
    close(EMAIL) or die;
}
313 | ||
01806192 MM |
# Create a fresh working directory "./tmp/<id>" and remember it in $tmp_dir.
# <id> is the output of uuidgen, or a random number when uuidgen printed
# nothing.  Dies if the directory cannot be created.
sub make_tmp_dir()
{
    my $id = `uuidgen 2>/dev/null`;
    chomp $id;
    unless (defined $id and $id ne "") {
        $id = rand;
    }
    $tmp_dir = "./tmp/$id";
    mkdir($tmp_dir) or die;
}
322 | ||
# Remove the working directory created by make_tmp_dir(), if it is set and
# still exists.
sub clean_tmp_dir()
{
    if ($tmp_dir ne "" && -d $tmp_dir) {
        system("rm -rf $tmp_dir");
    }
}
328 | ||
2e33bbbc MM |
# Files and directories created below stay group-writable.
umask(002);

# One run handles exactly one spool file.
find_file_in_spool();
read_spool_file();
make_tmp_dir();
fetch_files();

# Stay silent only when nothing was fetched, nothing went wrong and the
# request did not ask for a reply.
if ($force_reply or $problems ne "" or $fetched_count != 0) {
    send_email();
}
clean_tmp_dir();