-
Notifications
You must be signed in to change notification settings - Fork 0
/
client.c
718 lines (634 loc) · 23.5 KB
/
client.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
/*
* zsync - client side rsync over http
* Copyright (C) 2004,2005,2007,2009 Colin Phipps <cph@moria.org.uk>
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the Artistic License v2 (see the accompanying
* file COPYING for the full license terms), or, at your option, any later
* version of the same license.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* COPYING file for details.
*/
/* zsync command-line client program */
#include "zsglobal.h"
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <fcntl.h>
#include <errno.h>
#include <ctype.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <utime.h>
#ifdef WITH_DMALLOC
# include <dmalloc.h>
#endif
#include "libzsync/zsync.h"
#include "http.h"
#include "url.h"
#include "progress.h"
/* FILE* f = open_zcat_pipe(file_str)
 * Returns a (popen) filehandle which when read returns the un-gzipped content
 * of the given file. Returns NULL on error (the command buffer could not be
 * allocated, or popen failed); the returned filehandle may also fail to read.
 * It is up to the caller to call pclose() on the handle and check the return
 * value of that.
 * Unless progress output is disabled, the command line that is about to be
 * run is announced on stderr.
 */
FILE* open_zcat_pipe(const char* fname)
{
    /* Get buffer to build command line. Worst case every byte of fname needs
     * a backslash in front of it: "zcat " (5) + 2 * strlen(fname) + NUL (1) */
    char *cmd = malloc(6 + strlen(fname) * 2);

    if (!cmd)
        return NULL;

    strcpy(cmd, "zcat ");

    {   /* Add filename to commandline, escaping any characters that the shell
         * might consider special. */
        size_t i, j;

        for (i = 0, j = 5; fname[i]; i++) {
            /* <ctype.h> classifiers need a value representable as unsigned
             * char; a plain char may be negative for non-ASCII bytes, which
             * would be undefined behaviour. */
            if (!isalnum((unsigned char)fname[i]))
                cmd[j++] = '\\';
            cmd[j++] = fname[i];
        }
        cmd[j] = 0;
    }

    if (!no_progress)
        fprintf(stderr, "reading seed %s: ", cmd);

    {   /* Finally, open the subshell for reading, and return the handle */
        FILE* f = popen(cmd, "r");
        /* Callers report a NULL return with perror(); keep free() from
         * disturbing the errno that popen left behind. */
        int saved_errno = errno;

        free(cmd);
        errno = saved_errno;
        return f;
    }
}
/* read_seed_file(zsync, filename_str)
 * Feeds one local file to libzsync as a source of data for the target. If the
 * zsync state hints that decompression is wanted and the name ends in ".gz",
 * the file is read through a zcat pipe; otherwise it is opened directly.
 * Failure to open the file is reported on stderr and the file is skipped.
 * Afterwards (unless progress output is disabled) the percentage of the
 * target obtained so far is printed on stderr.
 */
void read_seed_file(struct zsync_state *z, const char *fname) {
    const size_t name_len = strlen(fname);
    /* Decompress only when libzsync asks for it AND the name is "<x>.gz" */
    const int gzipped = zsync_hint_decompress(z) && name_len > 3
        && strcmp(fname + name_len - 3, ".gz") == 0;
    FILE *src = gzipped ? open_zcat_pipe(fname) : fopen(fname, "r");

    if (src == NULL) {
        perror(gzipped ? "popen" : "open");
        fprintf(stderr, "not using seed file %s\n", fname);
    }
    else {
        /* The zcat path already announced itself in open_zcat_pipe() */
        if (!gzipped && !no_progress)
            fprintf(stderr, "reading seed file %s: ", fname);

        /* Let libzsync scan the stream for blocks that belong to the target */
        zsync_submit_source_file(z, src, !no_progress);

        /* Close with whichever call matches how the stream was opened */
        if ((gzipped ? pclose(src) : fclose(src)) != 0) {
            perror("close");
        }
    }

    {   /* Report overall progress towards the target file */
        long long got, want;

        zsync_progress(z, &got, &want);
        if (!no_progress)
            fprintf(stderr, "\rDone reading %s. %02.1f%% of target obtained. \n",
                    fname, (100.0f * got) / want);
    }
}
/* Running total of bytes fetched over HTTP: fetch_remaining_blocks_http()
 * adds each range fetch's byte count to it, and main() prints it in the
 * final statistics line. */
long long http_down;
/* A ptrlist is a minimal growable list of pointers: a heap-allocated void*[]
 * plus an int (kept by the caller) holding the number of entries. This
 * function is its whole API.
 *
 * ptrlist = append_ptrlist(&entries, ptrlist, new_entry)
 * Grows the array by one slot, stores new_entry in it and increments the
 * entry count in place. Like realloc, it returns the (possibly moved) array,
 * which the caller must store. A NULL new_entry is ignored and the list is
 * returned unchanged. If memory runs out the program exits with status 1.
 */
static void **append_ptrlist(int *n, void **p, void *a) {
    void **grown;

    /* Nothing to add */
    if (a == NULL)
        return p;

    grown = realloc(p, (*n + 1) * sizeof *grown);
    if (grown == NULL) {
        fprintf(stderr, "out of memory\n");
        exit(1);
    }

    /* Store in the new last slot, then bump the caller's count */
    grown[*n] = a;
    *n += 1;
    return grown;
}
/* zs = read_zsync_control_file(location_str, filename)
 * Loads a zsync control file and returns the zsync_state built from it.
 * location_str is first tried as a local path; if that cannot be opened and
 * it is an absolute URL, it is fetched over HTTP instead, and the global
 * referer is set to the path reported by http_get().
 * filename is handed to http_get() as the place to save a local copy of the
 * .zsync when it is retrieved from a URL; it can be NULL in which case no
 * local copy is made.
 * Never returns on failure: exits with 2 if the location is neither a
 * readable file nor a URL (or if closing the stream fails), 3 if the URL
 * fetch fails, and 1 if zsync_begin() rejects the content.
 */
struct zsync_state *read_zsync_control_file(const char *p, const char *fn) {
    struct zsync_state *state;
    char *fetched_from = NULL;
    FILE *ctl = fopen(p, "r");      /* local path takes precedence */

    if (ctl == NULL) {
        /* Not a local file - unless it is a URL there is nothing to try */
        if (!is_url_absolute(p)) {
            perror(p);
            exit(2);
        }

        ctl = http_get(p, &fetched_from, fn);
        if (ctl == NULL) {
            fprintf(stderr, "could not read control file from URL %s\n", p);
            exit(3);
        }

        /* Remember where the .zsync came from */
        referer = fetched_from;
    }

    /* Parse the .zsync */
    state = zsync_begin(ctl);
    if (state == NULL) {
        exit(1);
    }

    /* Done with the stream */
    if (fclose(ctl) != 0) {
        perror("fclose");
        exit(2);
    }

    return state;
}
/* str = get_filename_prefix(path_str)
 * Returns a (malloced) string of the alphanumeric leading segment of the
 * filename in the given file path, i.e. the run of alphanumeric characters
 * that immediately follows the last '/' (or starts the string if there is no
 * '/'). Returns NULL if that segment is empty or if memory cannot be
 * allocated. The caller owns the result and must free() it.
 */
static char *get_filename_prefix(const char *p) {
    const char *base = strrchr(p, '/');
    const char *end;
    char *prefix;
    size_t len;

    /* Skip past the last path separator, if any */
    base = base ? base + 1 : p;

    /* Measure the leading alphanumeric run. The cast matters: <ctype.h>
     * functions are undefined for negative values, which a plain char can
     * hold for non-ASCII bytes. */
    for (end = base; isalnum((unsigned char)*end); end++)
        ;
    len = (size_t)(end - base);
    if (len == 0)
        return NULL;

    /* Copy just the prefix out of the caller's string */
    prefix = malloc(len + 1);
    if (!prefix)
        return NULL;
    memcpy(prefix, base, len);
    prefix[len] = '\0';
    return prefix;
}
/* filename_str = get_filename(zs, source_filename_str)
 * Returns a (malloced string with a) suitable filename for a zsync download,
 * using the given zsync state and source filename strings as hints.
 * The filename recorded in the zsync state is used only if it contains no
 * '/' and begins with the alphanumeric prefix of source_name's filename;
 * otherwise it is rejected (with a message on stderr where applicable) and
 * that prefix itself is used, or "zsync-download" if there is no prefix. */
char *get_filename(const struct zsync_state *zs, const char *source_name) {
    char *p = zsync_filename(zs);
    char *filename = NULL;

    if (p) {
        if (strchr(p, '/')) {
            /* Never let the control file steer the download to another dir */
            fprintf(stderr,
                    "Rejected filename specified in %s, contained path component.\n",
                    source_name);
            free(p);
        }
        else {
            char *t = get_filename_prefix(source_name);

            /* strncmp rather than memcmp: p may be shorter than t, and
             * comparing strlen(t) raw bytes would read past its end. */
            if (t && !strncmp(p, t, strlen(t))) {
                filename = p;
            }
            else {
                /* Report before releasing p - the message prints it */
                if (t) {
                    fprintf(stderr,
                            "Rejected filename specified in %s - prefix %s differed from filename %s.\n",
                            source_name, t, p);
                }
                free(p);
            }
            free(t);
        }
    }

    /* Fall back to the source name's prefix, then to a fixed default */
    if (!filename) {
        filename = get_filename_prefix(source_name);
        if (!filename)
            filename = strdup("zsync-download");
    }
    return filename;
}
/* prog = calc_zsync_progress(zs)
 * Returns how much of the target the given zsync_state has obtained, as a
 * percentage: 100 * (amount done) / (total), using the two figures reported
 * by zsync_progress(). */
static float calc_zsync_progress(const struct zsync_state *zs) {
    long long have, want;

    zsync_progress(zs, &have, &want);
    return ((100.0f * have) / want);
}
/* fetch_remaining_blocks_http(struct zsync*, const char* url, int type)
 * For the given zsync_state, using the given absolute HTTP URL (which is a
 * copy of the actual content of the target file if type == 0, or a compressed
 * copy of it if type == 1), retrieve the parts of the target that are
 * currently missing.
 * Returns 0 if this URL was useful, non-zero if we crashed and burned:
 *  -1 if the fetch could not be set up (range fetch, receiver or buffer) or
 *     the range fetch reported an error while reading;
 *   1 if the needed byte ranges could not be obtained or the zsync receiver
 *     rejected the data.
 * Bytes downloaded by a fetch that actually ran are added to http_down.
 */
#define BUFFERSIZE 8192
int fetch_remaining_blocks_http(struct zsync_state *z, const char *u,
                                int type) {
    int ret = 0;
    struct range_fetch *rf;
    unsigned char *buf;
    struct zsync_receiver *zr;

    /* Start a range fetch and a zsync receiver */
    rf = range_fetch_start(u);
    if (!rf) {
        return -1;
    }
    zr = zsync_begin_receive(z, type);
    if (!zr) {
        range_fetch_end(rf);
        return -1;
    }

    if (!no_progress)
        fprintf(stderr, "downloading new blocks from %s:", u);

    /* Create a read buffer */
    buf = malloc(BUFFERSIZE);
    if (!buf) {
        ret = -1;
        goto cleanup;
    }

    {   /* Get a set of byte ranges that we need to complete the target */
        int nrange;
        off_t *zbyterange = zsync_needed_byte_ranges(z, &nrange, type);

        /* Both early exits go through cleanup so that the buffer, receiver
         * and range fetch are released rather than leaked. */
        if (!zbyterange) {
            ret = 1;
            goto cleanup;
        }
        if (nrange == 0) {
            /* Nothing is missing; ret is still 0 */
            free(zbyterange);
            goto cleanup;
        }

        /* And give that to the range fetcher */
        range_fetch_addranges(rf, zbyterange, nrange);
        free(zbyterange);
    }

    {
        int len;
        off_t zoffset = 0;          /* defined even if no block is returned */
        struct progress *p = NULL;  /* only set when progress is displayed */

        /* Set up progress display to run during the fetch */
        if (!no_progress) {
            fputc('\n', stderr);
            p = start_progress();
            do_progress(p, calc_zsync_progress(z), range_fetch_bytes_down(rf));
        }

        /* Loop while we're receiving data, until we're done or there is an error */
        while (!ret
               && (len = get_range_block(rf, &zoffset, buf, BUFFERSIZE)) > 0) {
            /* Pass received data to the zsync receiver, which writes it to the
             * appropriate location in the target file */
            if (zsync_receive_data(zr, buf, zoffset, len) != 0)
                ret = 1;

            /* Maintain progress display */
            if (!no_progress)
                do_progress(p, calc_zsync_progress(z),
                            range_fetch_bytes_down(rf));

            // Needed in case next call returns len=0 and we need to signal where the EOF was.
            zoffset += len;
        }

        /* If error, we need to flag that to our caller */
        if (len < 0)
            ret = -1;
        else    /* Else, let the zsync receiver know that we're at EOF; there
                 * could be data in its buffer that it can use or needs to process */
            if (zsync_receive_data(zr, NULL, zoffset, 0) != 0)
                ret = 1;

        if (!no_progress)
            end_progress(p, zsync_status(z) >= 2 ? 2 : len == 0 ? 1 : 0);
    }

    /* Account for what this fetch downloaded */
    http_down += range_fetch_bytes_down(rf);

cleanup:
    /* Clean up */
    free(buf);
    zsync_end_receive(zr);
    range_fetch_end(rf);
    return ret;
}
/* fetch_remaining_blocks_from_url(struct zsync_state*, url, type)
 * For the given zsync_state, using the given URL (which is a copy of the
 * actual content of the target file if type == 0, or a compressed copy of it
 * if type == 1), retrieve the parts of the target that are currently missing.
 * The URL may be relative; it is resolved against the global referer first.
 * Returns 0 if this URL was useful; -1 if the URL could not be made
 * absolute; otherwise the non-zero result of fetch_remaining_blocks_http().
 */
int fetch_remaining_blocks_from_url(struct zsync_state *zs, const char *url,
                                    int type) {
    int result;
    /* A fetch needs an absolute URL */
    char *absolute = make_url_absolute(referer, url);

    if (absolute == NULL) {
        fprintf(stderr,
                "URL '%s' from the .zsync file is relative, but I don't know the referer URL (you probably downloaded the .zsync separately and gave it to me as a file). I need to know the referring URL (the URL of the .zsync) in order to locate the download. You can specify this with -u (or edit the URL line(s) in the .zsync file you have).\n",
                url);
        return -1;
    }

    /* Attempt the download and report if this URL was no use */
    result = fetch_remaining_blocks_http(zs, absolute, type);
    if (result) {
        fprintf(stderr, "failed to retrieve from %s\n", absolute);
    }

    free(absolute);
    return result;
}
/* int fetch_remaining_blocks(struct zsync_state*)
 * Using the URLs in the supplied zsync state, downloads data to complete the
 * target file. URLs are tried in random order; a URL that fails once is not
 * tried again, and the loop ends when the target is complete or every URL
 * has failed.
 * Returns 0 if there were no URLs to download from, 1 if there were (in which
 * case consult zsync_status to see how far it got).
 * Exits with status 1 if the per-URL status array cannot be allocated.
 */
int fetch_remaining_blocks(struct zsync_state *zs) {
    int n, utype;
    const char *const *url = zsync_get_urls(zs, &n, &utype);
    int *status;        /* keep status for each URL - 0 means no error */
    int ok_urls;

    if (!url) {
        fprintf(stderr, "No download URLs known\n");
        return 0;
    }

    /* Only read n once we know a URL list was actually returned */
    ok_urls = n;
    status = calloc(n, sizeof *status);
    if (!status && n != 0) {
        /* calloc(0, ...) may legitimately return NULL, hence the n check */
        fprintf(stderr, "out of memory\n");
        exit(1);
    }

    /* Keep going until we're done or have no useful URLs left */
    while (zsync_status(zs) < 2 && ok_urls) {
        /* Still need data; pick a URL to use. */
        int try = rand() % n;

        if (!status[try]) {
            /* Try fetching data from this URL */
            int rc = fetch_remaining_blocks_from_url(zs, url[try], utype);
            if (rc != 0) {
                /* Mark it bad so it is never picked again */
                status[try] = 1;
                ok_urls--;
            }
        }
    }
    free(status);
    return 1;
}
/* rc = set_mtime(filename, mtime)
 * Sets the modification time of the named file to mtime while keeping its
 * current access time. Returns 0 on success; on failure of stat() or utime()
 * reports the error with perror() and returns -1. */
static int set_mtime(char* filename, time_t mtime) {
    struct stat current;
    struct utimbuf stamps;

    /* utime() sets both times, so fetch the access time to pass it back */
    if (stat(filename, &current)) {
        perror("stat");
        return -1;
    }

    stamps.modtime = mtime;
    stamps.actime = current.st_atime;

    if (utime(filename, &stamps)) {
        perror("utime");
        return -1;
    }

    return 0;
}
/****************************************************************************
 *
 * Main program
 *
 * Options: -A host=user:pass (HTTP authentication), -k file (where to keep a
 * copy of a .zsync fetched from a URL), -o file (output filename), -i file
 * (seed file, repeatable), -u url (referer URL for relative URLs), -s / -q
 * (no progress output), -V (print version and exit). Exactly one non-option
 * argument is required: the path or URL of the .zsync file.
 *
 * Exit status as used below: 0 on completion (and for -V); 1 for a bad -A
 * argument, out of memory, or failure to rename the working file; 2 if
 * verification aborts; 3 for usage errors or an incomplete download. */
int main(int argc, char **argv) {
    struct zsync_state *zs;
    char *temp_file = NULL;
    /* Kept as void** because that is what append_ptrlist() takes and
     * returns; char** is not a compatible pointer type. */
    void **seedfiles = NULL;
    int nseedfiles = 0;
    char *filename = NULL;
    long long local_used;
    char *zfname = NULL;
    time_t mtime;

    srand(getpid());
    {   /* Option parsing */
        int opt;

        while ((opt = getopt(argc, argv, "A:k:o:i:Vsqu:")) != -1) {
            switch (opt) {
            case 'A':           /* Authentication options for remote server */
                {               /* Scan string as hostname=username:password */
                    char *p = strdup(optarg);
                    char *q, *r;

                    if (!p) {
                        fprintf(stderr, "out of memory\n");
                        exit(1);
                    }
                    q = strchr(p, '=');
                    r = q ? strchr(q, ':') : NULL;
                    if (!q || !r) {
                        fprintf(stderr,
                                "-A takes hostname=username:password\n");
                        exit(1);
                    }
                    else {
                        /* Split in place into three NUL-terminated parts */
                        *q++ = *r++ = 0;
                        add_auth(p, q, r);
                    }
                }
                break;
            case 'k':
                free(zfname);
                zfname = strdup(optarg);
                break;
            case 'o':
                free(filename);
                filename = strdup(optarg);
                break;
            case 'i':
                seedfiles = append_ptrlist(&nseedfiles, seedfiles, optarg);
                break;
            case 'V':
                printf(PACKAGE " v" VERSION " (compiled " __DATE__ " " __TIME__
                       ")\n" "By Colin Phipps <cph@moria.org.uk>\n"
                       "Published under the Artistic License v2, see the COPYING file for details.\n");
                exit(0);
            case 's':
            case 'q':
                no_progress = 1;
                break;
            case 'u':
                /* Release any earlier -u value, as -k and -o do */
                free(referer);
                referer = strdup(optarg);
                break;
            }
        }
    }

    /* Last and only non-option parameter must be the path/URL of the .zsync */
    if (optind == argc) {
        fprintf(stderr,
                "No .zsync file specified.\nUsage: zsync http://example.com/some/filename.zsync\n");
        exit(3);
    }
    else if (optind < argc - 1) {
        fprintf(stderr,
                "Usage: zsync http://example.com/some/filename.zsync\n");
        exit(3);
    }

    /* No progress display except on terminal */
    if (!isatty(0))
        no_progress = 1;

    {   /* Get proxy setting from the environment */
        char *pr = getenv("http_proxy");

        if (pr != NULL)
            set_proxy_from_string(pr);
    }

    /* STEP 1: Read the zsync control file */
    if ((zs = read_zsync_control_file(argv[optind], zfname)) == NULL)
        exit(1);

    /* Get eventual filename for output, and filename to write to while working */
    if (!filename)
        filename = get_filename(zs, argv[optind]);
    if (!filename) {
        fprintf(stderr, "out of memory\n");
        exit(1);
    }
    /* strlen(".part") + terminating NUL == 6 */
    temp_file = malloc(strlen(filename) + 6);
    if (!temp_file) {
        fprintf(stderr, "out of memory\n");
        exit(1);
    }
    strcpy(temp_file, filename);
    strcat(temp_file, ".part");

    {   /* STEP 2: read available local data and fill in what we know in the
         * target file */
        int i;

        /* If the target file already exists, we're probably updating that file
         * - so it's a seed file */
        if (!access(filename, R_OK)) {
            seedfiles = append_ptrlist(&nseedfiles, seedfiles, filename);
        }
        /* If the .part file exists, it's probably an interrupted earlier
         * effort; a normal HTTP client would 'resume' from where it got to,
         * but zsync can't (because we don't know this data corresponds to the
         * current version on the remote) and doesn't need to, because we can
         * treat it like any other local source of data. Use it now. */
        if (!access(temp_file, R_OK)) {
            seedfiles = append_ptrlist(&nseedfiles, seedfiles, temp_file);
        }

        /* Try any seed files supplied by the command line */
        for (i = 0; i < nseedfiles; i++) {
            int dup = 0, j;

            /* And stop reading seed files once the target is complete. */
            if (zsync_status(zs) >= 2) break;

            /* Skip dups automatically, to save the person running the program
             * having to worry about this stuff. */
            for (j = 0; j < i; j++) {
                if (!strcmp(seedfiles[i],seedfiles[j])) dup = 1;
            }

            /* And now, if not a duplicate, read it */
            if (!dup)
                read_seed_file(zs, seedfiles[i]);
        }

        /* The list itself is no longer needed; the strings it pointed at are
         * owned elsewhere (argv, filename, temp_file). */
        free(seedfiles);
        seedfiles = NULL;

        /* Show how far that got us */
        zsync_progress(zs, &local_used, NULL);

        /* People that don't understand zsync might use it wrongly and end up
         * downloading everything. Although not essential, let's hint to them
         * that they probably messed up. */
        if (!local_used) {
            if (!no_progress)
                fputs
                    ("No relevent local data found - I will be downloading the whole file. If that's not what you want, CTRL-C out. You should specify the local file is the old version of the file to download with -i (you might have to decompress it with gzip -d first). Or perhaps you just have no data that helps download the file\n",
                     stderr);
        }
    }

    /* libzsync has been writing to a randomly-named temp file so far -
     * because we didn't want to overwrite the .part from previous runs. Now
     * we've read any previous .part, we can replace it with our new
     * in-progress run (which should be a superset of the old .part - unless
     * the content changed, in which case it still contains anything relevant
     * from the old .part). */
    if (zsync_rename_file(zs, temp_file) != 0) {
        perror("rename");
        exit(1);
    }

    /* STEP 3: fetch remaining blocks via the URLs from the .zsync */
    {
        int fetch_status = fetch_remaining_blocks(zs);
        int target_status = zsync_status(zs);

        if (target_status < 2) {
            fprintf(stderr,
                    "%s. Incomplete transfer left in %s.\n(If this is the download filename with .part appended, zsync will automatically pick this up and reuse the data it has already done if you retry in this dir.)\n",
                    fetch_status == 0
                    ? "No download URLs are known, so no data could be downloaded. The .zsync file is probably incomplete."
                    : target_status == 0
                    ? "No data downloaded - none of the download URLs worked"
                    : "Not all of the required data could be downloaded, and the remaining data could not be retrieved from any of the download URLs.",
                    temp_file);
            exit(3);
        }
    }

    {   /* STEP 4: verify download */
        int r;

        if (!no_progress)
            printf("verifying download...");
        r = zsync_complete(zs);
        switch (r) {
        case -1:
            fprintf(stderr, "Aborting, download available in %s\n", temp_file);
            exit(2);
        case 0:
            if (!no_progress)
                printf("no recognised checksum found\n");
            break;
        case 1:
            if (!no_progress)
                printf("checksum matches OK\n");
            break;
        }
    }

    free(temp_file);

    /* Get any mtime that is suggested for the file, and then shut down the
     * zsync_state as we are done with the file transfer, getting the
     * current name of the file at the same time. */
    mtime = zsync_mtime(zs);
    temp_file = zsync_end(zs);

    /* STEP 5: Move completed .part file into place as the final target */
    if (filename) {
        /* strlen(".zs-old") + terminating NUL == 8 */
        char *oldfile_backup = malloc(strlen(filename) + 8);
        int ok = 1;

        if (!oldfile_backup) {
            fprintf(stderr,
                    "out of memory - completed download left in %s\n",
                    temp_file);
            exit(1);
        }
        strcpy(oldfile_backup, filename);
        strcat(oldfile_backup, ".zs-old");

        if (!access(filename, F_OK)) {
            /* Backup the old file. */
            /* First, remove any previous backup. We don't care if this fails -
             * the link below will catch any failure */
            unlink(oldfile_backup);

            /* Try linking the filename to the backup file name, so we will
               atomically replace the target file in the next step.
               If that fails due to EPERM, it is probably a filesystem that
               doesn't support hard-links - so try just renaming it to the
               backup filename. */
            if (link(filename, oldfile_backup) != 0
                && (errno != EPERM || rename(filename, oldfile_backup) != 0)) {
                perror("linkname");
                fprintf(stderr,
                        "Unable to back up old file %s - completed download left in %s\n",
                        filename, temp_file);
                ok = 0;         /* Prevent overwrite of old file below */
            }
        }
        if (ok) {
            /* Rename the file to the desired name */
            if (rename(temp_file, filename) == 0) {
                /* final, final thing - set the mtime on the file if we have one */
                if (mtime != -1) set_mtime(filename, mtime);
            }
            else {
                perror("rename");
                /* This is the move into place failing, not the backup */
                fprintf(stderr,
                        "Unable to move completed download into place as %s - completed download left in %s\n",
                        filename, temp_file);
            }
        }
        free(oldfile_backup);
        free(filename);
    }
    else {
        printf
            ("No filename specified for download - completed download left in %s\n",
             temp_file);
    }

    /* Final stats and cleanup */
    if (!no_progress)
        printf("used %lld local, fetched %lld\n", local_used, http_down);
    free(referer);
    free(temp_file);
    return 0;
}