home *** CD-ROM | disk | FTP | other *** search
- /* unship.c -- for unpacking ship files via trn */
- /* Based on ship.c -- Not copyrighted 1991 Mark Adler. */
- /* Modified by Wayne Davison, but still not copyrighted. */
-
- #include "EXTERN.h"
- #include "common.h"
- #include "respond.h"
- #include "decode.h"
-
- typedef unsigned long ulg; /* 32-bit unsigned integer */
-
- /* Function prototypes */
-
- static void decode_line ANSI((unsigned char *));
- static void err ANSI((int));
-
- /* Globals for ship() */
- ulg ccnt; /* count of bytes read or written */
- ulg crc; /* CRC register */
- ulg buf4; /* four byte buffer */
- int bcnt; /* buffer count */
-
- unsigned int decb; /* bit buffer for decode */
- unsigned int decn; /* number of bits in decb */
-
- bool fast; /* true for arithmetic coding, else base 85 */
- bool overwrite = 1; /* should we overwrite existing files? */
-
- /* Errors */
- #define SE_FORM 1
- #define SE_CONT 2
- #define SE_CRC 3
- #define SE_OVER 4
- #define SE_FULL 5
- char *errors[] = {
- /* 1 */ "Invalid ship format.",
- /* 2 */ "This piece is out of sequence.",
- /* 3 */ "CRC check failed.",
- /* 4 */ "File already exists.",
- /* 5 */ "Error writing file.",
- };
-
- /* Set of 86 characters used for the base 85 digits (last one not used), and
- the 86 character arithmetic coding. Selected to be part of both the ASCII
- printable characters, and the common EBCDIC printable characters whose
- ASCII translations are universal. */
- unsigned char safe[] = {
- '{','"','#','$','%','&','\'','(',')','*','+',',','-','.','/',
- '0','1','2','3','4','5','6','7','8','9',':',';','<','=','>','?','@',
- 'A','B','C','D','E','F','G','H','I','J','K','L','M',
- 'N','O','P','Q','R','S','T','U','V','W','X','Y','Z','_',
- 'a','b','c','d','e','f','g','h','i','j','k','l','m',
- 'n','o','p','q','r','s','t','u','v','w','x','y','z','}'};
-
- #define LOWSZ (sizeof(safe)-64) /* low set size for fast coding */
-
- /* Special replacement pairs--if first of each pair is received, it is
- treated like the second member of the pair. You're probably
- wondering why. The first pair is for compatibility with an
- earlier version of ship that used ! for the base 85 zero digit.
- However, there exist ASCII-EBCDIC translation tables that don't
- know about exclamation marks. The second set has mysterious
- historical origins that are best left unspoken ... */
- unsigned char aliases[] = {'!','{','|','+',0};
-
- /* Inverse of safe[], filled in by unship_init() */
- unsigned char invsafe[256];
-
- /* Table of CRC-32's of all single byte values (made by makecrc.c) */
- ulg crctab[] = {
- 0x00000000L, 0x77073096L, 0xee0e612cL, 0x990951baL, 0x076dc419L,
- 0x706af48fL, 0xe963a535L, 0x9e6495a3L, 0x0edb8832L, 0x79dcb8a4L,
- 0xe0d5e91eL, 0x97d2d988L, 0x09b64c2bL, 0x7eb17cbdL, 0xe7b82d07L,
- 0x90bf1d91L, 0x1db71064L, 0x6ab020f2L, 0xf3b97148L, 0x84be41deL,
- 0x1adad47dL, 0x6ddde4ebL, 0xf4d4b551L, 0x83d385c7L, 0x136c9856L,
- 0x646ba8c0L, 0xfd62f97aL, 0x8a65c9ecL, 0x14015c4fL, 0x63066cd9L,
- 0xfa0f3d63L, 0x8d080df5L, 0x3b6e20c8L, 0x4c69105eL, 0xd56041e4L,
- 0xa2677172L, 0x3c03e4d1L, 0x4b04d447L, 0xd20d85fdL, 0xa50ab56bL,
- 0x35b5a8faL, 0x42b2986cL, 0xdbbbc9d6L, 0xacbcf940L, 0x32d86ce3L,
- 0x45df5c75L, 0xdcd60dcfL, 0xabd13d59L, 0x26d930acL, 0x51de003aL,
- 0xc8d75180L, 0xbfd06116L, 0x21b4f4b5L, 0x56b3c423L, 0xcfba9599L,
- 0xb8bda50fL, 0x2802b89eL, 0x5f058808L, 0xc60cd9b2L, 0xb10be924L,
- 0x2f6f7c87L, 0x58684c11L, 0xc1611dabL, 0xb6662d3dL, 0x76dc4190L,
- 0x01db7106L, 0x98d220bcL, 0xefd5102aL, 0x71b18589L, 0x06b6b51fL,
- 0x9fbfe4a5L, 0xe8b8d433L, 0x7807c9a2L, 0x0f00f934L, 0x9609a88eL,
- 0xe10e9818L, 0x7f6a0dbbL, 0x086d3d2dL, 0x91646c97L, 0xe6635c01L,
- 0x6b6b51f4L, 0x1c6c6162L, 0x856530d8L, 0xf262004eL, 0x6c0695edL,
- 0x1b01a57bL, 0x8208f4c1L, 0xf50fc457L, 0x65b0d9c6L, 0x12b7e950L,
- 0x8bbeb8eaL, 0xfcb9887cL, 0x62dd1ddfL, 0x15da2d49L, 0x8cd37cf3L,
- 0xfbd44c65L, 0x4db26158L, 0x3ab551ceL, 0xa3bc0074L, 0xd4bb30e2L,
- 0x4adfa541L, 0x3dd895d7L, 0xa4d1c46dL, 0xd3d6f4fbL, 0x4369e96aL,
- 0x346ed9fcL, 0xad678846L, 0xda60b8d0L, 0x44042d73L, 0x33031de5L,
- 0xaa0a4c5fL, 0xdd0d7cc9L, 0x5005713cL, 0x270241aaL, 0xbe0b1010L,
- 0xc90c2086L, 0x5768b525L, 0x206f85b3L, 0xb966d409L, 0xce61e49fL,
- 0x5edef90eL, 0x29d9c998L, 0xb0d09822L, 0xc7d7a8b4L, 0x59b33d17L,
- 0x2eb40d81L, 0xb7bd5c3bL, 0xc0ba6cadL, 0xedb88320L, 0x9abfb3b6L,
- 0x03b6e20cL, 0x74b1d29aL, 0xead54739L, 0x9dd277afL, 0x04db2615L,
- 0x73dc1683L, 0xe3630b12L, 0x94643b84L, 0x0d6d6a3eL, 0x7a6a5aa8L,
- 0xe40ecf0bL, 0x9309ff9dL, 0x0a00ae27L, 0x7d079eb1L, 0xf00f9344L,
- 0x8708a3d2L, 0x1e01f268L, 0x6906c2feL, 0xf762575dL, 0x806567cbL,
- 0x196c3671L, 0x6e6b06e7L, 0xfed41b76L, 0x89d32be0L, 0x10da7a5aL,
- 0x67dd4accL, 0xf9b9df6fL, 0x8ebeeff9L, 0x17b7be43L, 0x60b08ed5L,
- 0xd6d6a3e8L, 0xa1d1937eL, 0x38d8c2c4L, 0x4fdff252L, 0xd1bb67f1L,
- 0xa6bc5767L, 0x3fb506ddL, 0x48b2364bL, 0xd80d2bdaL, 0xaf0a1b4cL,
- 0x36034af6L, 0x41047a60L, 0xdf60efc3L, 0xa867df55L, 0x316e8eefL,
- 0x4669be79L, 0xcb61b38cL, 0xbc66831aL, 0x256fd2a0L, 0x5268e236L,
- 0xcc0c7795L, 0xbb0b4703L, 0x220216b9L, 0x5505262fL, 0xc5ba3bbeL,
- 0xb2bd0b28L, 0x2bb45a92L, 0x5cb36a04L, 0xc2d7ffa7L, 0xb5d0cf31L,
- 0x2cd99e8bL, 0x5bdeae1dL, 0x9b64c2b0L, 0xec63f226L, 0x756aa39cL,
- 0x026d930aL, 0x9c0906a9L, 0xeb0e363fL, 0x72076785L, 0x05005713L,
- 0x95bf4a82L, 0xe2b87a14L, 0x7bb12baeL, 0x0cb61b38L, 0x92d28e9bL,
- 0xe5d5be0dL, 0x7cdcefb7L, 0x0bdbdf21L, 0x86d3d2d4L, 0xf1d4e242L,
- 0x68ddb3f8L, 0x1fda836eL, 0x81be16cdL, 0xf6b9265bL, 0x6fb077e1L,
- 0x18b74777L, 0x88085ae6L, 0xff0f6a70L, 0x66063bcaL, 0x11010b5cL,
- 0x8f659effL, 0xf862ae69L, 0x616bffd3L, 0x166ccf45L, 0xa00ae278L,
- 0xd70dd2eeL, 0x4e048354L, 0x3903b3c2L, 0xa7672661L, 0xd06016f7L,
- 0x4969474dL, 0x3e6e77dbL, 0xaed16a4aL, 0xd9d65adcL, 0x40df0b66L,
- 0x37d83bf0L, 0xa9bcae53L, 0xdebb9ec5L, 0x47b2cf7fL, 0x30b5ffe9L,
- 0xbdbdf21cL, 0xcabac28aL, 0x53b39330L, 0x24b4a3a6L, 0xbad03605L,
- 0xcdd70693L, 0x54de5729L, 0x23d967bfL, 0xb3667a2eL, 0xc4614ab8L,
- 0x5d681b02L, 0x2a6f2b94L, 0xb40bbe37L, 0xc30c8ea1L, 0x5a05df1bL,
- 0x2d02ef8dL
- };
-
- /* Macro to update the CRC shift register one byte at a time */
- #define CRC(c,b) (crctab[((int)(c)^(int)(b))&0xff]^((c)>>8))
-
- /* cputc(d,x)--like putc(d,f), but delays four bytes and computes a CRC.
- x is a cfile *, and d is expected to be an ulg. */
- #define cputf(fp) (int)(crc=CRC(crc,buf4),putc((int)buf4&0xff,fp),ccnt++)
- #define cputc(d,fp) (bcnt!=4?bcnt++:cputf(fp),buf4=(buf4>>8)+((ulg)(d)<<24))
-
- /* Build invsafe[], the inverse of safe[]. */
- void
- unship_init()
- {
- int i;
-
- for (i = 0; i < 256; i++)
- invsafe[i] = 127;
- for (i = 0; i < sizeof(safe); i++)
- invsafe[safe[i]] = (char)i;
- for (i = 0; aliases[i]; i += 2)
- invsafe[aliases[i]] = invsafe[aliases[i + 1]];
- }
-
- int
- unship(in)
- FILE *in;
- {
- int b; /* state of line loop */
- char l[LBUFLEN]; /* line buffer on input */
- int counter; /** OS2-patch **/
- char *p; /* modifies line buffer */
- char *q; /* scans continuation line */
-
- /* Loop on the latest article's lines */
- b = 2; /* not in body yet */
- while (1) /* return on end of last file */
- {
- /* Get next line from file */
- if (fgets(l, LBUFLEN, in) == Nullch)
- break;
-
- /*** OS2: AAAAAAAAHHHHHHHHHHHH, ..... another problem with \r (^M)... **/
-
- for (counter = 0; counter <= strlen(l); counter++)
- if ((l[counter] == '\r') &&
- (l[counter+1] == '\n')) {
- for (; l[counter] != '\0'; counter++)
- l[counter] = l[counter+1];
- }
-
- /* Strip control characters and leading blank space, if any */
- for (q = l; *q && *q <= ' ' && *q != '\n'; q++)
- ;
- for (p = l; *q; q++)
- if (*q >= ' ' || *q == '\n')
- *p++ = *q;
- *p = 0;
-
- /* Based on current state, end or start on terminator. States are:
- b == 0: at start of body or body terminator line
- b == 1: in middle of body line
- b == 2: at start of non-body line
- b == 3: in middle of non-body line
- b == 4: at information line
- */
- switch (b)
- {
- case 0:
- if ((!fast && strEQ(l, "$\n")) ||
- (fast && strEQ(l, "$ f\n")))
- {
- b = 4;
- break;
- }
- /* fall through to case 1 */
- case 1:
- decode_line((unsigned char *)l);
- b = l[strlen(l) - 1] != '\n';
- break;
- case 2:
- if (strEQ(l, "$\n") || strEQ(l, "$ f\n"))
- {
- fast = l[1] == ' ';
- b = 4;
- break;
- }
- /* fall through to case 3 */
- case 3:
- b = l[strlen(l)-1] == '\n' ? 2 : 3;
- break;
- case 4:
- /* Possible information lines are ship, more, cont, and end */
- if (l[b = strlen(l) - 1] != '\n')
- {
- err(SE_FORM);
- decode_end();
- return -1;
- }
- l[b] = 0;
- if (strnEQ(l, "ship ", 5))
- {
- /* get name, open new output file */
- if (decode_fp != Nullfp)
- decode_end(); /* outputs an "incomplete" warning */
- if (strEQ(l + 5, "-"))
- strcpy(decode_fname, "unnamed");
- else
- strcpy(decode_fname, l + 5);
- sprintf(decode_dest, "%s/%s", extractdest, decode_fname);
- printf("Decoding: %s\n", decode_fname);
- #ifndef VMS /* shouldn't have explicit version #, so VMS won't overwrite */
- if (!overwrite && (decode_fp = fos2open(decode_dest, "r")) != Nullfp)
- {
- fclose(decode_fp);
- decode_fp = Nullfp;
- err(SE_OVER);
- return -1;
- }
- #endif /* !VMS */
- if ((decode_fp = fos2open(decode_dest, FOPEN_WB)) == Nullfp)
- {
- err(SE_FULL);
- return -1;
- }
- crc = 0xffffffffL; /* preload CRC register */
- buf4 = 0; /* empty fifo (for output) */
- bcnt = 0; /* fifo is empty (output) */
- b = decb = decn = 0;
- ccnt = 0;
- }
- else if (strEQ(l, "more"))
- {
- /* check if currently writing */
- if (decode_fp == Nullfp)
- {
- err(SE_FORM);
- return -1;
- }
- b = 2;
- }
- else if (strnEQ(l, "cont ", 5))
- {
- /* check name and file offset */
- if (decode_fp == Nullfp)
- {
- err(SE_CONT);
- return -1;
- }
- for (q = l + 5; *q && *q != ' '; q++)
- ;
- if (*q == 0 || atol(l + 5) != ccnt + 4 + (decn != 0) ||
- strNE(q + 1, decode_fname))
- {
- err(SE_CONT);
- return -1;
- }
- b = 0;
- }
- else if (strcmp(l, "end") == 0)
- {
- /* check crc, close output file */
- if (decode_fp == Nullfp)
- {
- err(SE_FORM);
- return -1;
- }
- if (bcnt != 4 || buf4 != ~crc)
- err(SE_CRC);
- else
- printf("CRC verified -- Done.\n");
- if (ferror(decode_fp) || fclose(decode_fp))
- {
- err(SE_FULL);
- decode_end();
- return -1;
- }
- decode_fp = Nullfp;
- b = 2;
- }
- else
- {
- for (q = l; *q && *q != ' '; q++)
- ;
- *q = 0;
- printf("Ignoring unsupported ship keyword: '%s'\n", l);
- b = 4;
- }
- break;
- }
- }
- if (!(b & 2)) {
- err(SE_FORM);
- return -1;
- }
- if (decode_fp)
- printf("(Continued)\n");
- return 0;
- }
-
- /* Decode s, a string of base 85 digits or, if fast is true, a string of safe
- characters generated arithmetically, into its binary equivalent, writing
- the result to decode_fp, using cputc(). */
- static void
- decode_line(s)
- unsigned char *s; /* data to decode */
- {
- int b; /* state of line loop, next character */
- int k; /* counts bits or digits read */
- /* powers of 85 table for decoding */
- static ulg m[] = {1L,85L,85L*85L,85L*85L*85L,85L*85L*85L*85L};
-
- if (fast)
- {
- unsigned int d; /* disperses bits */
-
- d = decb;
- k = decn;
- while ((b = *s++) != 0)
- if ((b = invsafe[b]) < sizeof(safe))
- {
- if (b < LOWSZ)
- {
- d |= b << k;
- k += 7;
- }
- else if ((b -= LOWSZ) < LOWSZ)
- {
- d |= (b + 0x40) << k;
- k += 7;
- }
- else
- {
- d |= b << k;
- k += 6;
- }
- if (k >= 8)
- {
- cputc(d, decode_fp);
- d >>= 8;
- k -= 8;
- }
- }
- decb = d;
- decn = k;
- }
- else
- {
- ulg d; /* disperses bytes */
-
- d = k = 0;
- while ((b = *s++) != 0)
- if ((b = invsafe[b]) < 85)
- {
- d += m[k] * b;
- if (++k == 5)
- {
- cputc(d, decode_fp); d >>= 8;
- cputc(d, decode_fp); d >>= 8;
- cputc(d, decode_fp); d >>= 8;
- cputc(d, decode_fp);
- d = k = 0;
- }
- }
- if (--k > 0)
- {
- while (--k)
- {
- cputc(d, decode_fp);
- d >>= 8;
- }
- cputc(d, decode_fp);
- }
- }
- }
-
- static void
- err(n)
- int n; /* error number */
- {
- if (n == SE_FULL)
- perror("ship");
- fputs(errors[n - 1], stdout);
- putchar('\n') ; FLUSH;
- }
-