]>
Commit | Line | Data |
---|---|---|
7c673cae FG |
1 | /* |
2 | * untgz.c -- Display contents and extract files from a gzip'd TAR file | |
3 | * | |
4 | * written by Pedro A. Aranda Gutierrez <paag@tid.es> | |
5 | * adaptation to Unix by Jean-loup Gailly <jloup@gzip.org> | |
6 | * various fixes by Cosmin Truta <cosmint@cs.ubbcluj.ro> | |
7 | */ | |
8 | ||
#include <errno.h>
#include <limits.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
14 | ||
15 | #include "zlib.h" | |
16 | ||
17 | #ifdef unix | |
18 | # include <unistd.h> | |
19 | #else | |
20 | # include <direct.h> | |
21 | # include <io.h> | |
22 | #endif | |
23 | ||
24 | #ifdef WIN32 | |
25 | #include <windows.h> | |
26 | # ifndef F_OK | |
27 | # define F_OK 0 | |
28 | # endif | |
29 | # define mkdir(dirname,mode) _mkdir(dirname) | |
30 | # ifdef _MSC_VER | |
31 | # define access(path,mode) _access(path,mode) | |
32 | # define chmod(path,mode) _chmod(path,mode) | |
33 | # define strdup(str) _strdup(str) | |
34 | # endif | |
35 | #else | |
36 | # include <utime.h> | |
37 | #endif | |
38 | ||
39 | ||
/* values used in typeflag field */

#define REGTYPE   '0'           /* regular file */
#define AREGTYPE  '\0'          /* regular file */
#define LNKTYPE   '1'           /* link */
#define SYMTYPE   '2'           /* reserved */
#define CHRTYPE   '3'           /* character special */
#define BLKTYPE   '4'           /* block special */
#define DIRTYPE   '5'           /* directory */
#define FIFOTYPE  '6'           /* FIFO special */
#define CONTTYPE  '7'           /* reserved */

/* GNU tar extensions */

#define GNUTYPE_DUMPDIR   'D'   /* file names from dumped directory */
#define GNUTYPE_LONGLINK  'K'   /* long link name */
#define GNUTYPE_LONGNAME  'L'   /* long file name */
#define GNUTYPE_MULTIVOL  'M'   /* continuation of file from another volume */
#define GNUTYPE_NAMES     'N'   /* file name that does not fit into main hdr */
#define GNUTYPE_SPARSE    'S'   /* sparse file */
#define GNUTYPE_VOLHDR    'V'   /* tape/volume header */


/* tar header */

#define BLOCKSIZE     512       /* bytes requested by every gzread() in tar() */
#define SHORTNAMESIZE 100       /* size of the name field of a tar header */
67 | ||
/*
 * Layout of a tar header.  Every member is a char array (or a single
 * char), so the byte offsets noted on the right follow directly from
 * the member sizes; the members add up to 500 bytes.
 */
struct tar_header
{
  char name[100];               /* offset   0 */
  char mode[8];                 /* offset 100 */
  char uid[8];                  /* offset 108 */
  char gid[8];                  /* offset 116 */
  char size[12];                /* offset 124 */
  char mtime[12];               /* offset 136 */
  char chksum[8];               /* offset 148 */
  char typeflag;                /* offset 156 */
  char linkname[100];           /* offset 157 */
  char magic[6];                /* offset 257 */
  char version[2];              /* offset 263 */
  char uname[32];               /* offset 265 */
  char gname[32];               /* offset 297 */
  char devmajor[8];             /* offset 329 */
  char devminor[8];             /* offset 337 */
  char prefix[155];             /* offset 345 */
                                /* end:   500 */
};
88 | ||
89 | union tar_buffer | |
90 | { | |
91 | char buffer[BLOCKSIZE]; | |
92 | struct tar_header header; | |
93 | }; | |
94 | ||
/*
 * Node of the singly linked list filled by push_attr() and consumed by
 * restore_attr(): the mode and time stamp to apply to one extracted
 * path.
 */
struct attr_item
{
  struct attr_item  *next;      /* next node, NULL at the end of the list */
  char              *fname;     /* copy of the path made with strdup() */
  int                mode;      /* mode handed to chmod() */
  time_t             time;      /* time stamp handed to setfiletime() */
};
102 | ||
103 | enum { TGZ_EXTRACT, TGZ_LIST, TGZ_INVALID }; | |
104 | ||
105 | char *TGZfname OF((const char *)); | |
106 | void TGZnotfound OF((const char *)); | |
107 | ||
108 | int getoct OF((char *, int)); | |
109 | char *strtime OF((time_t *)); | |
110 | int setfiletime OF((char *, time_t)); | |
111 | void push_attr OF((struct attr_item **, char *, int, time_t)); | |
112 | void restore_attr OF((struct attr_item **)); | |
113 | ||
114 | int ExprMatch OF((char *, char *)); | |
115 | ||
116 | int makedir OF((char *)); | |
117 | int matchname OF((int, int, char **, char *)); | |
118 | ||
119 | void error OF((const char *)); | |
120 | int tar OF((gzFile, int, int, int, char **)); | |
121 | ||
122 | void help OF((int)); | |
123 | int main OF((int, char **)); | |
124 | ||
125 | char *prog; | |
126 | ||
127 | const char *TGZsuffix[] = { "\0", ".tar", ".tar.gz", ".taz", ".tgz", NULL }; | |
128 | ||
129 | /* return the file name of the TGZ archive */ | |
130 | /* or NULL if it does not exist */ | |
131 | ||
132 | char *TGZfname (const char *arcname) | |
133 | { | |
134 | static char buffer[1024]; | |
135 | int origlen,i; | |
136 | ||
137 | strcpy(buffer,arcname); | |
138 | origlen = strlen(buffer); | |
139 | ||
140 | for (i=0; TGZsuffix[i]; i++) | |
141 | { | |
142 | strcpy(buffer+origlen,TGZsuffix[i]); | |
143 | if (access(buffer,F_OK) == 0) | |
144 | return buffer; | |
145 | } | |
146 | return NULL; | |
147 | } | |
148 | ||
149 | ||
150 | /* error message for the filename */ | |
151 | ||
152 | void TGZnotfound (const char *arcname) | |
153 | { | |
154 | int i; | |
155 | ||
156 | fprintf(stderr,"%s: Couldn't find ",prog); | |
157 | for (i=0;TGZsuffix[i];i++) | |
158 | fprintf(stderr,(TGZsuffix[i+1]) ? "%s%s, " : "or %s%s\n", | |
159 | arcname, | |
160 | TGZsuffix[i]); | |
161 | exit(1); | |
162 | } | |
163 | ||
164 | ||
/*
 * Convert octal digits to int.
 *
 * Reads at most `width` characters from p.  A NUL ends the field and
 * blanks are skipped.  Returns the value, or -1 on error: a character
 * that is neither an octal digit, a blank nor NUL, or a value that
 * does not fit into an int (previously this overflowed a signed int,
 * which is undefined behaviour).  A width of zero or less yields 0.
 */

int getoct (char *p,int width)
{
  int result = 0;

  while (width-- > 0)
  {
    char c = *p++;
    int digit;

    if (c == 0)
      break;
    if (c == ' ')
      continue;
    if (c < '0' || c > '7')
      return -1;
    digit = c - '0';
    /* refuse the digit if result * 8 + digit would exceed INT_MAX */
    if (result > (INT_MAX - digit) / 8)
      return -1;
    result = result * 8 + digit;
  }
  return result;
}
186 | ||
187 | ||
/*
 * Convert time_t to string, using the "YYYY/MM/DD hh:mm:ss" format
 * (local time).
 *
 * The result points to a static buffer that is overwritten by the next
 * call.  If localtime() cannot convert the value it returns NULL; in
 * that case a placeholder of the same width is returned instead of
 * dereferencing the NULL pointer.
 */

char *strtime (time_t *t)
{
  static char result[32];
  struct tm *local;

  local = localtime(t);
  if (local == NULL)
  {
    strcpy(result,"????/??/?? ??:??:??");
    return result;
  }
  sprintf(result,"%4d/%02d/%02d %02d:%02d:%02d",
          local->tm_year+1900, local->tm_mon+1, local->tm_mday,
          local->tm_hour, local->tm_min, local->tm_sec);
  return result;
}
202 | ||
203 | ||
/*
 * Set file time.
 *
 * Returns 0 on success and a negative value on failure (-1 on the
 * WIN32 path, the result of utime() otherwise).
 *
 * WIN32: ftime is converted to local broken-down time, then to a
 * FILETIME, and stored as the last-write time.  The file is opened
 * with CreateFileA explicitly because fname is a narrow string; the
 * generic CreateFile name maps to the wide-character variant when
 * UNICODE is defined.
 *
 * Elsewhere: both access and modification time are set with utime().
 */

int setfiletime (char *fname,time_t ftime)
{
#ifdef WIN32
  static int isWinNT = -1;
  SYSTEMTIME st;
  FILETIME locft, modft;
  struct tm *loctm;
  HANDLE hFile;
  int result;

  loctm = localtime(&ftime);
  if (loctm == NULL)
    return -1;

  st.wYear         = (WORD)(loctm->tm_year + 1900);
  st.wMonth        = (WORD)(loctm->tm_mon + 1);
  st.wDayOfWeek    = (WORD)loctm->tm_wday;
  st.wDay          = (WORD)loctm->tm_mday;
  st.wHour         = (WORD)loctm->tm_hour;
  st.wMinute       = (WORD)loctm->tm_min;
  st.wSecond       = (WORD)loctm->tm_sec;
  st.wMilliseconds = 0;
  if (!SystemTimeToFileTime(&st, &locft) ||
      !LocalFileTimeToFileTime(&locft, &modft))
    return -1;

  /* the platform check is done once and cached */
  if (isWinNT < 0)
    isWinNT = (GetVersion() < 0x80000000) ? 1 : 0;
  hFile = CreateFileA(fname, GENERIC_WRITE, 0, NULL, OPEN_EXISTING,
                      (isWinNT ? FILE_FLAG_BACKUP_SEMANTICS : 0),
                      NULL);
  if (hFile == INVALID_HANDLE_VALUE)
    return -1;
  result = SetFileTime(hFile, NULL, NULL, &modft) ? 0 : -1;
  CloseHandle(hFile);
  return result;
#else
  struct utimbuf settime;

  settime.actime = settime.modtime = ftime;
  return utime(fname,&settime);
#endif
}
249 | ||
250 | ||
251 | /* push file attributes */ | |
252 | ||
253 | void push_attr(struct attr_item **list,char *fname,int mode,time_t time) | |
254 | { | |
255 | struct attr_item *item; | |
256 | ||
257 | item = (struct attr_item *)malloc(sizeof(struct attr_item)); | |
258 | if (item == NULL) | |
259 | error("Out of memory"); | |
260 | item->fname = strdup(fname); | |
261 | item->mode = mode; | |
262 | item->time = time; | |
263 | item->next = *list; | |
264 | *list = item; | |
265 | } | |
266 | ||
267 | ||
268 | /* restore file attributes */ | |
269 | ||
270 | void restore_attr(struct attr_item **list) | |
271 | { | |
272 | struct attr_item *item, *prev; | |
273 | ||
274 | for (item = *list; item != NULL; ) | |
275 | { | |
276 | setfiletime(item->fname,item->time); | |
277 | chmod(item->fname,item->mode); | |
278 | prev = item; | |
279 | item = item->next; | |
280 | free(prev); | |
281 | } | |
282 | *list = NULL; | |
283 | } | |
284 | ||
285 | ||
/*
 * Match a file name against a wildcard expression.
 *
 * In expr:
 *   '*'  matches any run of characters, including none and including
 *        path separators;
 *   '/'  matches either '/' or '\\' in string;
 *   any other character matches itself.
 * The whole of string must be matched.  Returns 1 on a match, 0 otherwise.
 *
 * The matcher remembers the most recent '*' and, when the text after
 * it fails to match, retries with the '*' swallowing one more
 * character.  It never reads past the terminating NUL of either
 * argument.
 */

int ExprMatch (char *string,char *expr)
{
  const char *s = string;
  const char *e = expr;
  const char *star_e = NULL;    /* pattern position right after the last '*' */
  const char *star_s = NULL;    /* string position that '*' currently resumes at */

  while (*s != 0)
  {
    if (*e == '*')
    {
      star_e = ++e;
      star_s = s;
    }
    else if ((*e == '/') ? (*s == '/' || *s == '\\') : (*s == *e))
    {
      s++;
      e++;
    }
    else if (star_e != NULL)
    {
      /* let the last '*' absorb one more character and retry */
      e = star_e;
      s = ++star_s;
    }
    else
      return 0;
  }

  /* string is exhausted: only trailing '*' may remain in the pattern */
  while (*e == '*')
    e++;
  return (*e == 0) ? 1 : 0;
}
321 | ||
322 | ||
323 | /* recursive mkdir */ | |
324 | /* abort on ENOENT; ignore other errors like "directory already exists" */ | |
325 | /* return 1 if OK */ | |
326 | /* 0 on error */ | |
327 | ||
328 | int makedir (char *newdir) | |
329 | { | |
330 | char *buffer = strdup(newdir); | |
331 | char *p; | |
332 | int len = strlen(buffer); | |
333 | ||
334 | if (len <= 0) { | |
335 | free(buffer); | |
336 | return 0; | |
337 | } | |
338 | if (buffer[len-1] == '/') { | |
339 | buffer[len-1] = '\0'; | |
340 | } | |
341 | if (mkdir(buffer, 0755) == 0) | |
342 | { | |
343 | free(buffer); | |
344 | return 1; | |
345 | } | |
346 | ||
347 | p = buffer+1; | |
348 | while (1) | |
349 | { | |
350 | char hold; | |
351 | ||
352 | while(*p && *p != '\\' && *p != '/') | |
353 | p++; | |
354 | hold = *p; | |
355 | *p = 0; | |
356 | if ((mkdir(buffer, 0755) == -1) && (errno == ENOENT)) | |
357 | { | |
358 | fprintf(stderr,"%s: Couldn't create directory %s\n",prog,buffer); | |
359 | free(buffer); | |
360 | return 0; | |
361 | } | |
362 | if (hold == 0) | |
363 | break; | |
364 | *p++ = hold; | |
365 | } | |
366 | free(buffer); | |
367 | return 1; | |
368 | } | |
369 | ||
370 | ||
/*
 * Decide whether fname was selected on the command line.
 *
 * argv[arg] .. argv[argc-1] are the expressions given after the
 * archive name.  With no expressions at all (arg == argc) every name
 * is selected; otherwise fname must match at least one of them
 * according to ExprMatch().  Returns 1 if selected, 0 if not.
 */
int matchname (int arg,int argc,char **argv,char *fname)
{
  int i;

  if (arg == argc)              /* no arguments given (untgz tgzarchive) */
    return 1;

  for (i = arg; i < argc; i++)
  {
    if (ExprMatch(fname,argv[i]))
      return 1;
  }

  return 0;                     /* ignore this for the moment being */
}
382 | ||
383 | ||
384 | /* tar file list or extract */ | |
385 | ||
386 | int tar (gzFile in,int action,int arg,int argc,char **argv) | |
387 | { | |
388 | union tar_buffer buffer; | |
389 | int len; | |
390 | int err; | |
391 | int getheader = 1; | |
392 | int remaining = 0; | |
393 | FILE *outfile = NULL; | |
394 | char fname[BLOCKSIZE]; | |
395 | int tarmode; | |
396 | time_t tartime; | |
397 | struct attr_item *attributes = NULL; | |
398 | ||
399 | if (action == TGZ_LIST) | |
400 | printf(" date time size file\n" | |
401 | " ---------- -------- --------- -------------------------------------\n"); | |
402 | while (1) | |
403 | { | |
404 | len = gzread(in, &buffer, BLOCKSIZE); | |
405 | if (len < 0) | |
406 | error(gzerror(in, &err)); | |
407 | /* | |
408 | * Always expect complete blocks to process | |
409 | * the tar information. | |
410 | */ | |
411 | if (len != BLOCKSIZE) | |
412 | { | |
413 | action = TGZ_INVALID; /* force error exit */ | |
414 | remaining = 0; /* force I/O cleanup */ | |
415 | } | |
416 | ||
417 | /* | |
418 | * If we have to get a tar header | |
419 | */ | |
420 | if (getheader >= 1) | |
421 | { | |
422 | /* | |
423 | * if we met the end of the tar | |
424 | * or the end-of-tar block, | |
425 | * we are done | |
426 | */ | |
427 | if (len == 0 || buffer.header.name[0] == 0) | |
428 | break; | |
429 | ||
430 | tarmode = getoct(buffer.header.mode,8); | |
431 | tartime = (time_t)getoct(buffer.header.mtime,12); | |
432 | if (tarmode == -1 || tartime == (time_t)-1) | |
433 | { | |
434 | buffer.header.name[0] = 0; | |
435 | action = TGZ_INVALID; | |
436 | } | |
437 | ||
438 | if (getheader == 1) | |
439 | { | |
440 | strncpy(fname,buffer.header.name,SHORTNAMESIZE); | |
441 | if (fname[SHORTNAMESIZE-1] != 0) | |
442 | fname[SHORTNAMESIZE] = 0; | |
443 | } | |
444 | else | |
445 | { | |
446 | /* | |
447 | * The file name is longer than SHORTNAMESIZE | |
448 | */ | |
449 | if (strncmp(fname,buffer.header.name,SHORTNAMESIZE-1) != 0) | |
450 | error("bad long name"); | |
451 | getheader = 1; | |
452 | } | |
453 | ||
454 | /* | |
455 | * Act according to the type flag | |
456 | */ | |
457 | switch (buffer.header.typeflag) | |
458 | { | |
459 | case DIRTYPE: | |
460 | if (action == TGZ_LIST) | |
461 | printf(" %s <dir> %s\n",strtime(&tartime),fname); | |
462 | if (action == TGZ_EXTRACT) | |
463 | { | |
464 | makedir(fname); | |
465 | push_attr(&attributes,fname,tarmode,tartime); | |
466 | } | |
467 | break; | |
468 | case REGTYPE: | |
469 | case AREGTYPE: | |
470 | remaining = getoct(buffer.header.size,12); | |
471 | if (remaining == -1) | |
472 | { | |
473 | action = TGZ_INVALID; | |
474 | break; | |
475 | } | |
476 | if (action == TGZ_LIST) | |
477 | printf(" %s %9d %s\n",strtime(&tartime),remaining,fname); | |
478 | else if (action == TGZ_EXTRACT) | |
479 | { | |
480 | if (matchname(arg,argc,argv,fname)) | |
481 | { | |
482 | outfile = fopen(fname,"wb"); | |
483 | if (outfile == NULL) { | |
484 | /* try creating directory */ | |
485 | char *p = strrchr(fname, '/'); | |
486 | if (p != NULL) { | |
487 | *p = '\0'; | |
488 | makedir(fname); | |
489 | *p = '/'; | |
490 | outfile = fopen(fname,"wb"); | |
491 | } | |
492 | } | |
493 | if (outfile != NULL) | |
494 | printf("Extracting %s\n",fname); | |
495 | else | |
496 | fprintf(stderr, "%s: Couldn't create %s",prog,fname); | |
497 | } | |
498 | else | |
499 | outfile = NULL; | |
500 | } | |
501 | getheader = 0; | |
502 | break; | |
503 | case GNUTYPE_LONGLINK: | |
504 | case GNUTYPE_LONGNAME: | |
505 | remaining = getoct(buffer.header.size,12); | |
506 | if (remaining < 0 || remaining >= BLOCKSIZE) | |
507 | { | |
508 | action = TGZ_INVALID; | |
509 | break; | |
510 | } | |
511 | len = gzread(in, fname, BLOCKSIZE); | |
512 | if (len < 0) | |
513 | error(gzerror(in, &err)); | |
514 | if (fname[BLOCKSIZE-1] != 0 || (int)strlen(fname) > remaining) | |
515 | { | |
516 | action = TGZ_INVALID; | |
517 | break; | |
518 | } | |
519 | getheader = 2; | |
520 | break; | |
521 | default: | |
522 | if (action == TGZ_LIST) | |
523 | printf(" %s <---> %s\n",strtime(&tartime),fname); | |
524 | break; | |
525 | } | |
526 | } | |
527 | else | |
528 | { | |
529 | unsigned int bytes = (remaining > BLOCKSIZE) ? BLOCKSIZE : remaining; | |
530 | ||
531 | if (outfile != NULL) | |
532 | { | |
533 | if (fwrite(&buffer,sizeof(char),bytes,outfile) != bytes) | |
534 | { | |
535 | fprintf(stderr, | |
536 | "%s: Error writing %s -- skipping\n",prog,fname); | |
537 | fclose(outfile); | |
538 | outfile = NULL; | |
539 | remove(fname); | |
540 | } | |
541 | } | |
542 | remaining -= bytes; | |
543 | } | |
544 | ||
545 | if (remaining == 0) | |
546 | { | |
547 | getheader = 1; | |
548 | if (outfile != NULL) | |
549 | { | |
550 | fclose(outfile); | |
551 | outfile = NULL; | |
552 | if (action != TGZ_INVALID) | |
553 | push_attr(&attributes,fname,tarmode,tartime); | |
554 | } | |
555 | } | |
556 | ||
557 | /* | |
558 | * Abandon if errors are found | |
559 | */ | |
560 | if (action == TGZ_INVALID) | |
561 | { | |
562 | error("broken archive"); | |
563 | break; | |
564 | } | |
565 | } | |
566 | ||
567 | /* | |
568 | * Restore file modes and time stamps | |
569 | */ | |
570 | restore_attr(&attributes); | |
571 | ||
572 | if (gzclose(in) != Z_OK) | |
573 | error("failed gzclose"); | |
574 | ||
575 | return 0; | |
576 | } | |
577 | ||
578 | ||
579 | /* ============================================================ */ | |
580 | ||
/*
 * Print the program and zlib versions followed by the usage summary
 * on stdout, then terminate with exit status exitval.
 */
void help(int exitval)
{
  const char *zver = zlibVersion();

  printf("untgz version 0.2.1\n"
         " using zlib version %s\n\n",
         zver);
  /* the usage text has no conversions, so it is written as is */
  fputs("Usage: untgz file.tgz extract all files\n"
        " untgz file.tgz fname ... extract selected files\n"
        " untgz -l file.tgz list archive contents\n"
        " untgz -h display this help\n",
        stdout);
  exit(exitval);
}
592 | ||
593 | void error(const char *msg) | |
594 | { | |
595 | fprintf(stderr, "%s: %s\n", prog, msg); | |
596 | exit(1); | |
597 | } | |
598 | ||
599 | ||
600 | /* ============================================================ */ | |
601 | ||
602 | #if defined(WIN32) && defined(__GNUC__) | |
603 | int _CRT_glob = 0; /* disable argument globbing in MinGW */ | |
604 | #endif | |
605 | ||
606 | int main(int argc,char **argv) | |
607 | { | |
608 | int action = TGZ_EXTRACT; | |
609 | int arg = 1; | |
610 | char *TGZfile; | |
611 | gzFile *f; | |
612 | ||
613 | prog = strrchr(argv[0],'\\'); | |
614 | if (prog == NULL) | |
615 | { | |
616 | prog = strrchr(argv[0],'/'); | |
617 | if (prog == NULL) | |
618 | { | |
619 | prog = strrchr(argv[0],':'); | |
620 | if (prog == NULL) | |
621 | prog = argv[0]; | |
622 | else | |
623 | prog++; | |
624 | } | |
625 | else | |
626 | prog++; | |
627 | } | |
628 | else | |
629 | prog++; | |
630 | ||
631 | if (argc == 1) | |
632 | help(0); | |
633 | ||
634 | if (strcmp(argv[arg],"-l") == 0) | |
635 | { | |
636 | action = TGZ_LIST; | |
637 | if (argc == ++arg) | |
638 | help(0); | |
639 | } | |
640 | else if (strcmp(argv[arg],"-h") == 0) | |
641 | { | |
642 | help(0); | |
643 | } | |
644 | ||
645 | if ((TGZfile = TGZfname(argv[arg])) == NULL) | |
646 | TGZnotfound(argv[arg]); | |
647 | ||
648 | ++arg; | |
649 | if ((action == TGZ_LIST) && (arg != argc)) | |
650 | help(1); | |
651 | ||
652 | /* | |
653 | * Process the TGZ file | |
654 | */ | |
655 | switch(action) | |
656 | { | |
657 | case TGZ_LIST: | |
658 | case TGZ_EXTRACT: | |
659 | f = gzopen(TGZfile,"rb"); | |
660 | if (f == NULL) | |
661 | { | |
662 | fprintf(stderr,"%s: Couldn't gzopen %s\n",prog,TGZfile); | |
663 | return 1; | |
664 | } | |
665 | exit(tar(f, action, arg, argc, argv)); | |
666 | break; | |
667 | ||
668 | default: | |
669 | error("Unknown option"); | |
670 | exit(1); | |
671 | } | |
672 | ||
673 | return 0; | |
674 | } |