9e052883 |
1 | /* |
2 | * untgz.c -- Display contents and extract files from a gzip'd TAR file |
3 | * |
4 | * written by Pedro A. Aranda Gutierrez <paag@tid.es> |
5 | * adaptation to Unix by Jean-loup Gailly <jloup@gzip.org> |
6 | * various fixes by Cosmin Truta <cosmint@cs.ubbcluj.ro> |
7 | */ |
8 | |
#include <errno.h>
#include <limits.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
14 | |
15 | #include "zlib.h" |
16 | |
17 | #ifdef unix |
18 | # include <unistd.h> |
19 | #else |
20 | # include <direct.h> |
21 | # include <io.h> |
22 | #endif |
23 | |
24 | #ifdef WIN32 |
25 | #include <windows.h> |
26 | # ifndef F_OK |
27 | # define F_OK 0 |
28 | # endif |
29 | # define mkdir(dirname,mode) _mkdir(dirname) |
30 | # ifdef _MSC_VER |
31 | # define access(path,mode) _access(path,mode) |
32 | # define chmod(path,mode) _chmod(path,mode) |
33 | # define strdup(str) _strdup(str) |
34 | # endif |
35 | #else |
36 | # include <utime.h> |
37 | #endif |
38 | |
39 | |
/* Values stored in the typeflag field of a tar header */

#define REGTYPE   '0'     /* regular file */
#define AREGTYPE  '\0'    /* regular file (alternate encoding) */
#define LNKTYPE   '1'     /* link */
#define SYMTYPE   '2'     /* reserved */
#define CHRTYPE   '3'     /* character special */
#define BLKTYPE   '4'     /* block special */
#define DIRTYPE   '5'     /* directory */
#define FIFOTYPE  '6'     /* FIFO special */
#define CONTTYPE  '7'     /* reserved */

/* Additional typeflag values defined by GNU tar */

#define GNUTYPE_DUMPDIR   'D'   /* file names from dumped directory */
#define GNUTYPE_LONGLINK  'K'   /* long link name */
#define GNUTYPE_LONGNAME  'L'   /* long file name */
#define GNUTYPE_MULTIVOL  'M'   /* continuation of file from another volume */
#define GNUTYPE_NAMES     'N'   /* file name that does not fit into main hdr */
#define GNUTYPE_SPARSE    'S'   /* sparse file */
#define GNUTYPE_VOLHDR    'V'   /* tape/volume header */


/* Sizes used when reading the archive */

#define BLOCKSIZE      512      /* the archive is read in blocks of this size */
#define SHORTNAMESIZE  100      /* width of the name field in the header */
67 | |
/*
 * Layout of a tar header as it appears at the start of a block.
 * All members are character data, so the structure has no padding and
 * the member offsets are the byte offsets noted on the right.
 * mode, size and mtime are decoded with getoct() elsewhere in this file.
 */
struct tar_header
{
    char name[100];       /* offset   0: member name */
    char mode[8];         /* offset 100: permission bits, octal digits */
    char uid[8];          /* offset 108 */
    char gid[8];          /* offset 116 */
    char size[12];        /* offset 124: member size, octal digits */
    char mtime[12];       /* offset 136: modification time, octal digits */
    char chksum[8];       /* offset 148 */
    char typeflag;        /* offset 156: one of the *TYPE constants */
    char linkname[100];   /* offset 157 */
    char magic[6];        /* offset 257 */
    char version[2];      /* offset 263 */
    char uname[32];       /* offset 265 */
    char gname[32];       /* offset 297 */
    char devmajor[8];     /* offset 329 */
    char devminor[8];     /* offset 337 */
    char prefix[155];     /* offset 345 */
                          /* total: 500 bytes */
};
88 | |
89 | union tar_buffer |
90 | { |
91 | char buffer[BLOCKSIZE]; |
92 | struct tar_header header; |
93 | }; |
94 | |
/*
 * Node of a singly linked list that remembers the mode and time stamp
 * to apply to an extracted file or directory once extraction is done.
 */
struct attr_item
{
    struct attr_item *next;   /* next node, or NULL at the end of the list */
    char *fname;              /* path of the extracted entry */
    int mode;                 /* mode passed to chmod() */
    time_t time;              /* time stamp passed to setfiletime() */
};
102 | |
/* What to do with the archive; TGZ_INVALID marks a broken archive */
enum
{
    TGZ_EXTRACT,
    TGZ_LIST,
    TGZ_INVALID
};
104 | |
105 | char *TGZfname OF((const char *)); |
106 | void TGZnotfound OF((const char *)); |
107 | |
108 | int getoct OF((char *, int)); |
109 | char *strtime OF((time_t *)); |
110 | int setfiletime OF((char *, time_t)); |
111 | void push_attr OF((struct attr_item **, char *, int, time_t)); |
112 | void restore_attr OF((struct attr_item **)); |
113 | |
114 | int ExprMatch OF((char *, char *)); |
115 | |
116 | int makedir OF((char *)); |
117 | int matchname OF((int, int, char **, char *)); |
118 | |
119 | void error OF((const char *)); |
120 | int tar OF((gzFile, int, int, int, char **)); |
121 | |
122 | void help OF((int)); |
123 | int main OF((int, char **)); |
124 | |
/* Program name printed in front of diagnostics; assigned in main() */
char *prog;

/*
 * Suffixes appended, in this order, to the archive name given on the
 * command line.  The first entry is empty (the name is tried as given);
 * the list is terminated by NULL.
 */
const char *TGZsuffix[] = {
    "\0",
    ".tar",
    ".tar.gz",
    ".taz",
    ".tgz",
    NULL
};
128 | |
129 | /* return the file name of the TGZ archive */ |
130 | /* or NULL if it does not exist */ |
131 | |
132 | char *TGZfname (const char *arcname) |
133 | { |
134 | static char buffer[1024]; |
135 | int origlen,i; |
136 | |
137 | strcpy(buffer,arcname); |
138 | origlen = strlen(buffer); |
139 | |
140 | for (i=0; TGZsuffix[i]; i++) |
141 | { |
142 | strcpy(buffer+origlen,TGZsuffix[i]); |
143 | if (access(buffer,F_OK) == 0) |
144 | return buffer; |
145 | } |
146 | return NULL; |
147 | } |
148 | |
149 | |
150 | /* error message for the filename */ |
151 | |
152 | void TGZnotfound (const char *arcname) |
153 | { |
154 | int i; |
155 | |
156 | fprintf(stderr,"%s: Couldn't find ",prog); |
157 | for (i=0;TGZsuffix[i];i++) |
158 | fprintf(stderr,(TGZsuffix[i+1]) ? "%s%s, " : "or %s%s\n", |
159 | arcname, |
160 | TGZsuffix[i]); |
161 | exit(1); |
162 | } |
163 | |
164 | |
/*
 * Convert a field of octal digits to int.
 *
 * Reads at most `width' characters starting at p.  A NUL byte ends the
 * field, blanks are skipped, and any other character outside '0'..'7'
 * makes the field invalid.
 *
 * Returns the decoded value, or -1 if the field is invalid or the value
 * does not fit in an int (previously this overflowed, which is undefined
 * behaviour for signed arithmetic).  A non-positive width yields 0.
 */

int getoct (char *p,int width)
{
    int result = 0;

    while (width-- > 0)
    {
        char c = *p++;
        int digit;

        if (c == 0)
            break;
        if (c == ' ')
            continue;
        if (c < '0' || c > '7')
            return -1;
        digit = c - '0';
        /* result * 8 + digit must not exceed INT_MAX */
        if (result > (INT_MAX - digit) / 8)
            return -1;
        result = result * 8 + digit;
    }
    return result;
}
186 | |
187 | |
/*
 * Format *t as local time in the form "YYYY/MM/DD hh:mm:ss".
 *
 * Returns a pointer to a static buffer that is overwritten by the next
 * call.  If the time cannot be converted (localtime() returns NULL) a
 * placeholder of the same width is returned instead of dereferencing
 * the null pointer.
 */

char *strtime (time_t *t)
{
    static char result[32];
    struct tm *local;

    local = localtime(t);
    if (local == NULL)
    {
        strcpy(result,"----/--/-- --:--:--");
        return result;
    }
    sprintf(result,"%4d/%02d/%02d %02d:%02d:%02d",
            local->tm_year+1900, local->tm_mon+1, local->tm_mday,
            local->tm_hour, local->tm_min, local->tm_sec);
    return result;
}
202 | |
203 | |
/*
 * Set the time stamp of fname to ftime.
 *
 * On WIN32 only the last-write time is set, through the Win32 file
 * time API; elsewhere both access and modification time are set with
 * utime().  Returns 0 on success and -1 on failure.
 */

int setfiletime (char *fname,time_t ftime)
{
#ifdef WIN32
    static int on_nt = -1;      /* -1 until the platform has been probed */
    SYSTEMTIME systime;
    FILETIME local_ft, utc_ft;
    struct tm *tm_local;
    HANDLE handle;
    DWORD flags;
    int status;

    tm_local = localtime(&ftime);
    if (tm_local == NULL)
        return -1;

    /* broken-down local time -> SYSTEMTIME */
    systime.wYear = (WORD)tm_local->tm_year + 1900;
    systime.wMonth = (WORD)tm_local->tm_mon + 1;
    systime.wDayOfWeek = (WORD)tm_local->tm_wday;
    systime.wDay = (WORD)tm_local->tm_mday;
    systime.wHour = (WORD)tm_local->tm_hour;
    systime.wMinute = (WORD)tm_local->tm_min;
    systime.wSecond = (WORD)tm_local->tm_sec;
    systime.wMilliseconds = 0;

    /* SYSTEMTIME -> local FILETIME -> FILETIME passed to SetFileTime */
    if (!SystemTimeToFileTime(&systime, &local_ft))
        return -1;
    if (!LocalFileTimeToFileTime(&local_ft, &utc_ft))
        return -1;

    if (on_nt < 0)
        on_nt = (GetVersion() < 0x80000000) ? 1 : 0;
    flags = on_nt ? FILE_FLAG_BACKUP_SEMANTICS : 0;

    handle = CreateFile(fname, GENERIC_WRITE, 0, NULL, OPEN_EXISTING,
                        flags, NULL);
    if (handle == INVALID_HANDLE_VALUE)
        return -1;
    status = SetFileTime(handle, NULL, NULL, &utc_ft) ? 0 : -1;
    CloseHandle(handle);
    return status;
#else
    struct utimbuf stamp;

    stamp.modtime = ftime;
    stamp.actime = ftime;
    return utime(fname,&stamp);
#endif
}
249 | |
250 | |
251 | /* push file attributes */ |
252 | |
253 | void push_attr(struct attr_item **list,char *fname,int mode,time_t time) |
254 | { |
255 | struct attr_item *item; |
256 | |
257 | item = (struct attr_item *)malloc(sizeof(struct attr_item)); |
258 | if (item == NULL) |
259 | error("Out of memory"); |
260 | item->fname = strdup(fname); |
261 | item->mode = mode; |
262 | item->time = time; |
263 | item->next = *list; |
264 | *list = item; |
265 | } |
266 | |
267 | |
268 | /* restore file attributes */ |
269 | |
270 | void restore_attr(struct attr_item **list) |
271 | { |
272 | struct attr_item *item, *prev; |
273 | |
274 | for (item = *list; item != NULL; ) |
275 | { |
276 | setfiletime(item->fname,item->time); |
277 | chmod(item->fname,item->mode); |
278 | prev = item; |
279 | item = item->next; |
280 | free(prev); |
281 | } |
282 | *list = NULL; |
283 | } |
284 | |
285 | |
286 | /* match regular expression */ |
287 | |
288 | #define ISSPECIAL(c) (((c) == '*') || ((c) == '/')) |
289 | |
/*
 * Match string against the wildcard pattern expr.
 *
 *   '*'   matches any run of characters, including none and including
 *         directory separators
 *   '/'   matches either '/' or '\' in string
 *   other characters match themselves
 *
 * The whole string must be consumed by the pattern.
 * Returns 1 on a match and 0 otherwise.
 *
 * The scan remembers the most recent '*' and, on a mismatch, retries
 * with that '*' absorbing one more character, so patterns such as
 * "*.c" match "a.b.c".  Neither argument is read past its terminator.
 */
int ExprMatch (char *string,char *expr)
{
    const char *s = string;
    const char *e = expr;
    const char *star_e = NULL;  /* pattern position just after the last '*' */
    const char *star_s = NULL;  /* string position that '*' currently ends at */

    while (*s != 0)
    {
        if (*e == '*')
        {
            /* first try with the '*' matching nothing */
            star_e = ++e;
            star_s = s;
        }
        else if (*e == '/' ? (*s == '/' || *s == '\\')
                           : (*e != 0 && *e == *s))
        {
            s++;
            e++;
        }
        else if (star_e != NULL)
        {
            /* mismatch: let the last '*' swallow one more character */
            e = star_e;
            s = ++star_s;
        }
        else
            return 0;
    }

    /* string exhausted: only trailing '*' may remain in the pattern */
    while (*e == '*')
        e++;
    return *e == 0;
}
321 | |
322 | |
323 | /* recursive mkdir */ |
324 | /* abort on ENOENT; ignore other errors like "directory already exists" */ |
325 | /* return 1 if OK */ |
326 | /* 0 on error */ |
327 | |
328 | int makedir (char *newdir) |
329 | { |
330 | char *buffer = strdup(newdir); |
331 | char *p; |
332 | int len = strlen(buffer); |
333 | |
334 | if (len <= 0) { |
335 | free(buffer); |
336 | return 0; |
337 | } |
338 | if (buffer[len-1] == '/') { |
339 | buffer[len-1] = '\0'; |
340 | } |
341 | if (mkdir(buffer, 0755) == 0) |
342 | { |
343 | free(buffer); |
344 | return 1; |
345 | } |
346 | |
347 | p = buffer+1; |
348 | while (1) |
349 | { |
350 | char hold; |
351 | |
352 | while(*p && *p != '\\' && *p != '/') |
353 | p++; |
354 | hold = *p; |
355 | *p = 0; |
356 | if ((mkdir(buffer, 0755) == -1) && (errno == ENOENT)) |
357 | { |
358 | fprintf(stderr,"%s: Couldn't create directory %s\n",prog,buffer); |
359 | free(buffer); |
360 | return 0; |
361 | } |
362 | if (hold == 0) |
363 | break; |
364 | *p++ = hold; |
365 | } |
366 | free(buffer); |
367 | return 1; |
368 | } |
369 | |
370 | |
/*
 * Decide whether archive member fname was selected on the command line.
 *
 * argv[arg] .. argv[argc-1] are the member patterns.  With no patterns
 * at all every member is selected; otherwise the member must match at
 * least one pattern according to ExprMatch().
 * Returns 1 if selected, 0 if not.
 */
int matchname (int arg,int argc,char **argv,char *fname)
{
    int i;

    if (arg == argc)            /* no arguments given (untgz tgzarchive) */
        return 1;

    for (i = arg; i < argc; i++)
    {
        if (ExprMatch(fname,argv[i]))
            return 1;
    }
    return 0;
}
382 | |
383 | |
384 | /* tar file list or extract */ |
385 | |
386 | int tar (gzFile in,int action,int arg,int argc,char **argv) |
387 | { |
388 | union tar_buffer buffer; |
389 | int len; |
390 | int err; |
391 | int getheader = 1; |
392 | int remaining = 0; |
393 | FILE *outfile = NULL; |
394 | char fname[BLOCKSIZE]; |
395 | int tarmode; |
396 | time_t tartime; |
397 | struct attr_item *attributes = NULL; |
398 | |
399 | if (action == TGZ_LIST) |
400 | printf(" date time size file\n" |
401 | " ---------- -------- --------- -------------------------------------\n"); |
402 | while (1) |
403 | { |
404 | len = gzread(in, &buffer, BLOCKSIZE); |
405 | if (len < 0) |
406 | error(gzerror(in, &err)); |
407 | /* |
408 | * Always expect complete blocks to process |
409 | * the tar information. |
410 | */ |
411 | if (len != BLOCKSIZE) |
412 | { |
413 | action = TGZ_INVALID; /* force error exit */ |
414 | remaining = 0; /* force I/O cleanup */ |
415 | } |
416 | |
417 | /* |
418 | * If we have to get a tar header |
419 | */ |
420 | if (getheader >= 1) |
421 | { |
422 | /* |
423 | * if we met the end of the tar |
424 | * or the end-of-tar block, |
425 | * we are done |
426 | */ |
427 | if (len == 0 || buffer.header.name[0] == 0) |
428 | break; |
429 | |
430 | tarmode = getoct(buffer.header.mode,8); |
431 | tartime = (time_t)getoct(buffer.header.mtime,12); |
432 | if (tarmode == -1 || tartime == (time_t)-1) |
433 | { |
434 | buffer.header.name[0] = 0; |
435 | action = TGZ_INVALID; |
436 | } |
437 | |
438 | if (getheader == 1) |
439 | { |
440 | strncpy(fname,buffer.header.name,SHORTNAMESIZE); |
441 | if (fname[SHORTNAMESIZE-1] != 0) |
442 | fname[SHORTNAMESIZE] = 0; |
443 | } |
444 | else |
445 | { |
446 | /* |
447 | * The file name is longer than SHORTNAMESIZE |
448 | */ |
449 | if (strncmp(fname,buffer.header.name,SHORTNAMESIZE-1) != 0) |
450 | error("bad long name"); |
451 | getheader = 1; |
452 | } |
453 | |
454 | /* |
455 | * Act according to the type flag |
456 | */ |
457 | switch (buffer.header.typeflag) |
458 | { |
459 | case DIRTYPE: |
460 | if (action == TGZ_LIST) |
461 | printf(" %s <dir> %s\n",strtime(&tartime),fname); |
462 | if (action == TGZ_EXTRACT) |
463 | { |
464 | makedir(fname); |
465 | push_attr(&attributes,fname,tarmode,tartime); |
466 | } |
467 | break; |
468 | case REGTYPE: |
469 | case AREGTYPE: |
470 | remaining = getoct(buffer.header.size,12); |
471 | if (remaining == -1) |
472 | { |
473 | action = TGZ_INVALID; |
474 | break; |
475 | } |
476 | if (action == TGZ_LIST) |
477 | printf(" %s %9d %s\n",strtime(&tartime),remaining,fname); |
478 | else if (action == TGZ_EXTRACT) |
479 | { |
480 | if (matchname(arg,argc,argv,fname)) |
481 | { |
482 | outfile = fopen(fname,"wb"); |
483 | if (outfile == NULL) { |
484 | /* try creating directory */ |
485 | char *p = strrchr(fname, '/'); |
486 | if (p != NULL) { |
487 | *p = '\0'; |
488 | makedir(fname); |
489 | *p = '/'; |
490 | outfile = fopen(fname,"wb"); |
491 | } |
492 | } |
493 | if (outfile != NULL) |
494 | printf("Extracting %s\n",fname); |
495 | else |
496 | fprintf(stderr, "%s: Couldn't create %s",prog,fname); |
497 | } |
498 | else |
499 | outfile = NULL; |
500 | } |
501 | getheader = 0; |
502 | break; |
503 | case GNUTYPE_LONGLINK: |
504 | case GNUTYPE_LONGNAME: |
505 | remaining = getoct(buffer.header.size,12); |
506 | if (remaining < 0 || remaining >= BLOCKSIZE) |
507 | { |
508 | action = TGZ_INVALID; |
509 | break; |
510 | } |
511 | len = gzread(in, fname, BLOCKSIZE); |
512 | if (len < 0) |
513 | error(gzerror(in, &err)); |
514 | if (fname[BLOCKSIZE-1] != 0 || (int)strlen(fname) > remaining) |
515 | { |
516 | action = TGZ_INVALID; |
517 | break; |
518 | } |
519 | getheader = 2; |
520 | break; |
521 | default: |
522 | if (action == TGZ_LIST) |
523 | printf(" %s <---> %s\n",strtime(&tartime),fname); |
524 | break; |
525 | } |
526 | } |
527 | else |
528 | { |
529 | unsigned int bytes = (remaining > BLOCKSIZE) ? BLOCKSIZE : remaining; |
530 | |
531 | if (outfile != NULL) |
532 | { |
533 | if (fwrite(&buffer,sizeof(char),bytes,outfile) != bytes) |
534 | { |
535 | fprintf(stderr, |
536 | "%s: Error writing %s -- skipping\n",prog,fname); |
537 | fclose(outfile); |
538 | outfile = NULL; |
539 | remove(fname); |
540 | } |
541 | } |
542 | remaining -= bytes; |
543 | } |
544 | |
545 | if (remaining == 0) |
546 | { |
547 | getheader = 1; |
548 | if (outfile != NULL) |
549 | { |
550 | fclose(outfile); |
551 | outfile = NULL; |
552 | if (action != TGZ_INVALID) |
553 | push_attr(&attributes,fname,tarmode,tartime); |
554 | } |
555 | } |
556 | |
557 | /* |
558 | * Abandon if errors are found |
559 | */ |
560 | if (action == TGZ_INVALID) |
561 | { |
562 | error("broken archive"); |
563 | break; |
564 | } |
565 | } |
566 | |
567 | /* |
568 | * Restore file modes and time stamps |
569 | */ |
570 | restore_attr(&attributes); |
571 | |
572 | if (gzclose(in) != Z_OK) |
573 | error("failed gzclose"); |
574 | |
575 | return 0; |
576 | } |
577 | |
578 | |
579 | /* ============================================================ */ |
580 | |
/*
 * Print the program and zlib versions followed by the usage summary on
 * stdout, then terminate with exit status exitval.
 */
void help(int exitval)
{
    const char *zver = zlibVersion();

    printf("untgz version 0.2.1\n"
           " using zlib version %s\n\n",
           zver);
    fputs("Usage: untgz file.tgz extract all files\n"
          " untgz file.tgz fname ... extract selected files\n"
          " untgz -l file.tgz list archive contents\n"
          " untgz -h display this help\n",
          stdout);
    exit(exitval);
}
592 | |
593 | void error(const char *msg) |
594 | { |
595 | fprintf(stderr, "%s: %s\n", prog, msg); |
596 | exit(1); |
597 | } |
598 | |
599 | |
600 | /* ============================================================ */ |
601 | |
602 | #if defined(WIN32) && defined(__GNUC__) |
603 | int _CRT_glob = 0; /* disable argument globbing in MinGW */ |
604 | #endif |
605 | |
606 | int main(int argc,char **argv) |
607 | { |
608 | int action = TGZ_EXTRACT; |
609 | int arg = 1; |
610 | char *TGZfile; |
611 | gzFile *f; |
612 | |
613 | prog = strrchr(argv[0],'\\'); |
614 | if (prog == NULL) |
615 | { |
616 | prog = strrchr(argv[0],'/'); |
617 | if (prog == NULL) |
618 | { |
619 | prog = strrchr(argv[0],':'); |
620 | if (prog == NULL) |
621 | prog = argv[0]; |
622 | else |
623 | prog++; |
624 | } |
625 | else |
626 | prog++; |
627 | } |
628 | else |
629 | prog++; |
630 | |
631 | if (argc == 1) |
632 | help(0); |
633 | |
634 | if (strcmp(argv[arg],"-l") == 0) |
635 | { |
636 | action = TGZ_LIST; |
637 | if (argc == ++arg) |
638 | help(0); |
639 | } |
640 | else if (strcmp(argv[arg],"-h") == 0) |
641 | { |
642 | help(0); |
643 | } |
644 | |
645 | if ((TGZfile = TGZfname(argv[arg])) == NULL) |
646 | TGZnotfound(argv[arg]); |
647 | |
648 | ++arg; |
649 | if ((action == TGZ_LIST) && (arg != argc)) |
650 | help(1); |
651 | |
652 | /* |
653 | * Process the TGZ file |
654 | */ |
655 | switch(action) |
656 | { |
657 | case TGZ_LIST: |
658 | case TGZ_EXTRACT: |
659 | f = gzopen(TGZfile,"rb"); |
660 | if (f == NULL) |
661 | { |
662 | fprintf(stderr,"%s: Couldn't gzopen %s\n",prog,TGZfile); |
663 | return 1; |
664 | } |
665 | exit(tar(f, action, arg, argc, argv)); |
666 | break; |
667 | |
668 | default: |
669 | error("Unknown option"); |
670 | exit(1); |
671 | } |
672 | |
673 | return 0; |
674 | } |