libclamav/unzip.c
50593e02
 /*
2023340a
  *  Copyright (C) 2007-2008 Sourcefire, Inc.
  *
  *  Authors: Alberto Wu
50593e02
  *
  *  This program is free software; you can redistribute it and/or modify
  *  it under the terms of the GNU General Public License version 2 as
  *  published by the Free Software Foundation.
  *
  *  This program is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  *
  *  You should have received a copy of the GNU General Public License
  *  along with this program; if not, write to the Free Software
  *  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
  *  MA 02110-1301, USA.
  */
 
 /* FIXME: get a clue about masked stuff */
 
 #if HAVE_CONFIG_H
 #include "clamav-config.h"
 #endif
 
 #include <sys/types.h>
 #include <sys/stat.h>
 #include <fcntl.h>
 #ifdef HAVE_UNISTD_H
 #include <unistd.h>
 #endif
 #if HAVE_STRING_H
 #include <string.h>
 #endif
 #include <stdlib.h>
 #include <stdio.h>
 
 #include <zlib.h>
 #include "inflate64.h"
 #if HAVE_BZLIB_H
 #include <bzlib.h>
 #endif
 
f8be651b
 #include "explode.h"
50593e02
 #include "others.h"
 #include "clamav.h"
 #include "scanners.h"
 #include "matcher.h"
774898a7
 #include "fmap.h"
50593e02
 
 #define UNZIP_PRIVATE
 #include "unzip.h"
 
 static int wrap_inflateinit2(void *a, int b) {
   return inflateInit2(a, b);
 }
 
f8be651b
 /*
  * Unpack a single zip member into a temporary file and scan that file.
  *
  * src    - start of the member's raw data
  * csize  - number of bytes available at src (compressed size)
  * usize  - declared uncompressed size; only consulted for stored members,
  *          where csize < usize triggers an extra inflate attempt
  * method - zip compression method (one of the ALG_* values)
  * flags  - header flags, handed to explode_init() for imploded members
  * fu     - counter of unpacked files; it is used to build the temporary
  *          file name when tmpd is set and is incremented when a member
  *          has been extracted
  * ctx    - scan context (engine limits, tmpdir, keeptmp)
  * tmpd   - directory for the temporary file, or NULL to obtain a name
  *          from cli_gentemp()
  *
  * Returns the result of cli_magic_scandesc() when the member was
  * extracted, CL_EMEM / CL_ECREAT / CL_EWRITE on the corresponding failure,
  * CL_EUNLINK when the temporary file could not be removed, and otherwise
  * the initial CL_CLEAN when nothing could be extracted.
  */
 static int unz(uint8_t *src, uint32_t csize, uint32_t usize, uint16_t method, uint16_t flags, unsigned int *fu, cli_ctx *ctx, char *tmpd) {
   char name[1024], obuf[BUFSIZ];
   char *tempfile = name;
   int of, ret=CL_CLEAN;
   /* res: 0 means "extracted, go scan it"; any other value is a failure */
   unsigned int res=1, written=0;

   if(tmpd) {
     snprintf(name, sizeof(name), "%s"PATHSEP"zip.%03u", tmpd, *fu);
     name[sizeof(name)-1]='\0';
   } else {
     if(!(tempfile = cli_gentemp(ctx->engine->tmpdir))) return CL_EMEM;
   }
   if((of = open(tempfile, O_RDWR|O_CREAT|O_TRUNC|O_BINARY, S_IRUSR|S_IWUSR))==-1) {
     cli_warnmsg("cli_unzip: failed to create temporary file %s\n", tempfile);
     if(!tmpd) free(tempfile);
     return CL_ECREAT;
   }
   switch (method) {
   case ALG_STORED:
     if(csize<usize) {
       /* The sizes disagree: run the data through inflate first, using a
        * private counter so the nested call gets its own file name. */
       unsigned int fake = *fu + 1;
       cli_dbgmsg("cli_unzip: attempting to inflate stored file with inconsistent size\n");
       if ((ret=unz(src, csize, usize, ALG_DEFLATE, 0, &fake, ctx, tmpd))==CL_CLEAN) {
         (*fu)++;
         /* 1 if the nested call advanced its counter, 0 if it did not */
         res=fake-(*fu);
       }
       else break;
     }
     if(res==1) {
       if(ctx->engine->maxfilesize && csize > ctx->engine->maxfilesize) {
         cli_dbgmsg("cli_unzip: trimming output size to maxfilesize (%lu)\n", (long unsigned int) ctx->engine->maxfilesize);
         csize = ctx->engine->maxfilesize;
       }
       if(cli_writen(of, src, csize)!=(int)csize) ret = CL_EWRITE;
       else res=0;
     }
     break;

   case ALG_DEFLATE:
   case ALG_DEFLATE64: {
     /* Both inflate flavours are driven by the same loop: the entry points
      * and the stream fields are reached through pointers chosen below. */
     union {
       z_stream64 strm64;
       z_stream strm;
     } strm;
     typedef int (*unz_init_) (void *, int);
     typedef int (*unz_unz_) (void *, int);
     typedef int (*unz_end_) (void *);
     unz_init_ unz_init;
     unz_unz_ unz_unz;
     unz_end_ unz_end;
     int wbits;
     void **next_in;
     void **next_out;
     unsigned int *avail_in;
     unsigned int *avail_out;

     if(method == ALG_DEFLATE64) {
       unz_init = (unz_init_)inflate64Init2;
       unz_unz = (unz_unz_)inflate64;
       unz_end = (unz_end_)inflate64End;
       next_in = (void *)&strm.strm64.next_in;
       next_out = (void *)&strm.strm64.next_out;
       avail_in = &strm.strm64.avail_in;
       avail_out = &strm.strm64.avail_out;
       wbits=MAX_WBITS64;
     } else {
       unz_init = (unz_init_)wrap_inflateinit2;
       unz_unz = (unz_unz_)inflate;
       unz_end = (unz_end_)inflateEnd;
       next_in = (void *)&strm.strm.next_in;
       next_out = (void *)&strm.strm.next_out;
       avail_in = &strm.strm.avail_in;
       avail_out = &strm.strm.avail_out;
       wbits=MAX_WBITS;
     }

     memset(&strm, 0, sizeof(strm));

     *next_in = src;
     *next_out = obuf;
     *avail_in = csize;
     *avail_out = sizeof(obuf);
     /* the window bits value is passed negated */
     if (unz_init(&strm, -wbits)!=Z_OK) {
       cli_dbgmsg("cli_unzip: zinit failed\n");
       break;
     }
     while(1) {
       /* decompress until the call stops returning Z_OK */
       while((res = unz_unz(&strm, Z_NO_FLUSH))==Z_OK) {};
       if(*avail_out!=sizeof(obuf)) {
         /* something was produced: account for it, flush it, go again */
         written+=sizeof(obuf)-(*avail_out);
         if(ctx->engine->maxfilesize && written > ctx->engine->maxfilesize) {
           cli_dbgmsg("cli_unzip: trimming output size to maxfilesize (%lu)\n", (long unsigned int) ctx->engine->maxfilesize);
           /* treated as a normal end of stream; this last chunk is dropped */
           res = Z_STREAM_END;
           break;
         }
         if(cli_writen(of, obuf, sizeof(obuf)-(*avail_out)) != (int)(sizeof(obuf)-(*avail_out))) {
           /* the byte count is a size_t: cast it to match %lu */
           cli_warnmsg("cli_unzip: failed to write %lu inflated bytes\n", (unsigned long)(sizeof(obuf)-(*avail_out)));
           ret = CL_EWRITE;
           res = 100;
           break;
         }
         *next_out = obuf;
         *avail_out = sizeof(obuf);
         continue;
       }
       /* no output produced: stop and let res decide the outcome */
       break;
     }
     unz_end(&strm);
     if (res == Z_STREAM_END) res=0;
     break;
   }


 #if HAVE_BZLIB_H
 #ifdef NOBZ2PREFIX
 #define BZ2_bzDecompress bzDecompress
 #define BZ2_bzDecompressEnd bzDecompressEnd
 #define BZ2_bzDecompressInit bzDecompressInit
 #endif

   case ALG_BZIP2: {
     bz_stream strm;
     memset(&strm, 0, sizeof(strm));
     strm.next_in = (char *)src;
     strm.next_out = obuf;
     strm.avail_in = csize;
     strm.avail_out = sizeof(obuf);
     if (BZ2_bzDecompressInit(&strm, 0, 0)!=BZ_OK) {
       cli_dbgmsg("cli_unzip: bzinit failed\n");
       break;
     }
     while((res = BZ2_bzDecompress(&strm))==BZ_OK || res==BZ_STREAM_END) {
       if(strm.avail_out!=sizeof(obuf)) {
         written+=sizeof(obuf)-strm.avail_out;
         if(ctx->engine->maxfilesize && written > ctx->engine->maxfilesize) {
           cli_dbgmsg("cli_unzip: trimming output size to maxfilesize (%lu)\n", (unsigned long int) ctx->engine->maxfilesize);
           res = BZ_STREAM_END;
           break;
         }
         if(cli_writen(of, obuf, sizeof(obuf)-strm.avail_out) != (int)(sizeof(obuf)-strm.avail_out)) {
           /* the byte count is a size_t: cast it to match %lu */
           cli_warnmsg("cli_unzip: failed to write %lu bunzipped bytes\n", (unsigned long)(sizeof(obuf)-strm.avail_out));
           ret = CL_EWRITE;
           res = 100;
           break;
         }
         strm.next_out = obuf;
         strm.avail_out = sizeof(obuf);
         if (res == BZ_OK) continue; /* after returning BZ_STREAM_END once, decompress returns an error */
       }
       break;
     }
     BZ2_bzDecompressEnd(&strm);
     if (res == BZ_STREAM_END) res=0;
     break;
   }
 #endif /* HAVE_BZLIB_H */


   case ALG_IMPLODE: {
     struct xplstate strm;
     strm.next_in = src;
     strm.next_out = (uint8_t *)obuf;
     strm.avail_in = csize;
     strm.avail_out = sizeof(obuf);
     if (explode_init(&strm, flags)!=EXPLODE_OK) {
       cli_dbgmsg("cli_unzip: explode_init() failed\n");
       break;
     }
     while((res = explode(&strm))==EXPLODE_OK) {
       if(strm.avail_out!=sizeof(obuf)) {
         written+=sizeof(obuf)-strm.avail_out;
         if(ctx->engine->maxfilesize && written > ctx->engine->maxfilesize) {
           cli_dbgmsg("cli_unzip: trimming output size to maxfilesize (%lu)\n", (unsigned long int) ctx->engine->maxfilesize);
           res = 0;
           break;
         }
         if(cli_writen(of, obuf, sizeof(obuf)-strm.avail_out) != (int)(sizeof(obuf)-strm.avail_out)) {
           /* the byte count is a size_t: cast it to match %lu */
           cli_warnmsg("cli_unzip: failed to write %lu exploded bytes\n", (unsigned long)(sizeof(obuf)-strm.avail_out));
           ret = CL_EWRITE;
           res = 100;
           break;
         }
         strm.next_out = (uint8_t *)obuf;
         strm.avail_out = sizeof(obuf);
         continue;
       }
       break;
     }
     break;
   }


   case ALG_LZMA:
     /* easy but there's not a single sample in the zoo */

 #if !HAVE_BZLIB_H
   case ALG_BZIP2:
 #endif
   case ALG_SHRUNK:
   case ALG_REDUCE1:
   case ALG_REDUCE2:
   case ALG_REDUCE3:
   case ALG_REDUCE4:
   case ALG_TOKENZD:
   case ALG_OLDTERSE:
   case ALG_RSVD1:
   case ALG_RSVD2:
   case ALG_RSVD3:
   case ALG_RSVD4:
   case ALG_RSVD5:
   case ALG_NEWTERSE:
   case ALG_LZ77:
   case ALG_WAVPACK:
   case ALG_PPMD:
     cli_dbgmsg("cli_unzip: unsupported method (%d)\n", method);
     break;
   default:
     cli_dbgmsg("cli_unzip: unknown method (%d)\n", method);
     break;
   }

   if(!res) {
     /* extracted: count the file, rewind the descriptor and scan it */
     (*fu)++;
     cli_dbgmsg("cli_unzip: extracted to %s\n", tempfile);
     lseek(of, 0, SEEK_SET);
     ret = cli_magic_scandesc(of, ctx);
     close(of);
     if(!ctx->engine->keeptmp)
       if(cli_unlink(tempfile)) ret = CL_EUNLINK;
     if(!tmpd) free(tempfile);
     return ret;
   }

   /* nothing usable was extracted: just clean up */
   close(of);
   if(!ctx->engine->keeptmp)
     if(cli_unlink(tempfile)) ret = CL_EUNLINK;
   if(!tmpd) free(tempfile);
   cli_dbgmsg("cli_unzip: extraction failed\n");
   return ret;
 }
 
4bf5eb79
 /*
  * Parse the local file header found at loff and, when possible, hand the
  * member's data to unz().
  *
  * map              - file map being scanned
  * loff             - offset of the local header inside the map
  * zsize            - number of bytes available starting at loff
  * fu               - counter of unpacked files, forwarded to unz()
  * fc               - file number, used for logging and metadata matching
  * ch               - matching central header, or NULL when there is none;
  *                    it supplies the sizes when the data-descriptor flag
  *                    is set
  * ret              - receives CL_VIRUS on a metadata match or on
  *                    encrypted-archive detection, otherwise the result of
  *                    unz() when it is called
  * ctx              - scan context
  * tmpd             - temporary directory forwarded to unz() (may be NULL)
  * detect_encrypted - when non-zero, encrypted members are reported
  *                    (subject to DETECT_ENCRYPTED)
  *
  * Returns the distance in bytes from the start of this header to the end
  * of the entry, or 0 when processing stops at this header.
  */
 static unsigned int lhdr(fmap_t *map, uint32_t loff,uint32_t zsize, unsigned int *fu, unsigned int fc, uint8_t *ch, int *ret, cli_ctx *ctx, char *tmpd, int detect_encrypted) {
   uint8_t *lh, *zip;
   char name[256];
   uint32_t csize, usize;

   /* name is only filled in below when it is needed; keep it a valid empty
    * string otherwise, since it is still passed to cli_dbgmsg() and
    * cli_matchmeta() */
   name[0] = '\0';

   if(!(lh = fmap_need_off(map, loff, SIZEOF_LH))) {
     cli_dbgmsg("cli_unzip: lh - out of file\n");
     return 0;
   }
   if(LH_magic != 0x04034b50) {
     if (!ch) cli_dbgmsg("cli_unzip: lh - wrkcomplete\n");
     else cli_dbgmsg("cli_unzip: lh - bad magic\n");
     fmap_unneed_off(map, loff, SIZEOF_LH);
     return 0;
   }

   zip = lh + SIZEOF_LH;
   zsize-=SIZEOF_LH;

   if(zsize<=LH_flen) {
     cli_dbgmsg("cli_unzip: lh - fname out of file\n");
     fmap_unneed_off(map, loff, SIZEOF_LH);
     return 0;
   }
   if(ctx->engine->cdb || cli_debug_flag) {
     /* copy the (possibly truncated) file name */
     uint32_t nsize = (LH_flen>=sizeof(name))?sizeof(name)-1:LH_flen;
     if(nsize && fmap_need_ptr_once(map, zip, nsize)) {
       memcpy(name, zip, nsize);
       name[nsize]='\0';
     }
   }
   zip+=LH_flen;
   zsize-=LH_flen;

   cli_dbgmsg("cli_unzip: lh - ZMDNAME:%d:%s:%u:%u:%x:%u:%u:%u\n", ((LH_flags & F_ENCR)!=0), name, LH_usize, LH_csize, LH_crc32, LH_method, fc, ctx->recursion);
   /* ZMDfmt virname:encrypted(0-1):filename(exact|*):usize(exact|*):csize(exact|*):crc32(exact|*):method(exact|*):fileno(exact|*):maxdepth(exact|*) */

   if(cli_matchmeta(ctx, name, LH_csize, LH_usize, (LH_flags & F_ENCR)!=0, fc, LH_crc32, NULL) == CL_VIRUS) {
     *ret = CL_VIRUS;
     /* release the header here too, like every other early exit */
     fmap_unneed_off(map, loff, SIZEOF_LH);
     return 0;
   }

   if(LH_flags & F_MSKED) {
     cli_dbgmsg("cli_unzip: lh - header has got unusable masked data\n");
     /* FIXME: need to find/craft a sample */
     fmap_unneed_off(map, loff, SIZEOF_LH);
     return 0;
   }

   if(detect_encrypted && (LH_flags & F_ENCR) && DETECT_ENCRYPTED) {
     cli_dbgmsg("cli_unzip: Encrypted files found in archive.\n");
     cli_append_virus(ctx, "Heuristics.Encrypted.Zip");
     *ret = CL_VIRUS;
     fmap_unneed_off(map, loff, SIZEOF_LH);
     return 0;
   }

   if(LH_flags & F_USEDD) {
     /* with a data descriptor the sizes are taken from the central header */
     cli_dbgmsg("cli_unzip: lh - has data desc\n");
     if(!ch) {
       fmap_unneed_off(map, loff, SIZEOF_LH);
       return 0;
     }
     else { usize = CH_usize; csize = CH_csize; }
   } else { usize = LH_usize; csize = LH_csize; }

   if(zsize<=LH_elen) {
     cli_dbgmsg("cli_unzip: lh - extra out of file\n");
     fmap_unneed_off(map, loff, SIZEOF_LH);
     return 0;
   }
   zip+=LH_elen;
   zsize-=LH_elen;

   if (!csize) { /* FIXME: what's used for method0 files? csize or usize? Nothing in the specs, needs testing */
     cli_dbgmsg("cli_unzip: lh - skipping empty file\n");
   } else {
     if(zsize<csize) {
       cli_dbgmsg("cli_unzip: lh - stream out of file\n");
       fmap_unneed_off(map, loff, SIZEOF_LH);
       return 0;
     }
     if(LH_flags & F_ENCR) {
       cli_dbgmsg("cli_unzip: lh - skipping encrypted file\n");
     } else {
       if(fmap_need_ptr_once(map, zip, csize))
         *ret = unz(zip, csize, usize, LH_method, LH_flags, fu, ctx, tmpd);
     }
     zip+=csize;
     zsize-=csize;
   }

   fmap_unneed_off(map, loff, SIZEOF_LH); /* unneed now. block is guaranteed to exists till the next need */
   if(LH_flags & F_USEDD) {
     /* step over the 12-byte data descriptor, plus its 4-byte signature
      * when one is present */
     if(zsize<12) {
       cli_dbgmsg("cli_unzip: lh - data desc out of file\n");
       return 0;
     }
     zsize-=12;
     if(fmap_need_ptr_once(map, zip, 4)) {
       if(cli_readint32(zip)==0x08074b50) {
         if(zsize<4) {
           cli_dbgmsg("cli_unzip: lh - data desc out of file\n");
           return 0;
         }
         zip+=4;
       }
     }
     zip+=12;
   }
   return zip-lh;
 }
 
 
49cc1e3c
 /*
  * Handle one central directory header located at coff and process the
  * local header it points to.
  *
  * map   - file map being scanned
  * coff  - offset of the central header
  * zsize - size used for all bounds checks on offsets and lengths
  * fu    - counter of unpacked files, forwarded to lhdr()
  * fc    - file number, forwarded to lhdr()
  * ret   - scan result slot, forwarded to lhdr()
  * ctx   - scan context
  * tmpd  - temporary directory, forwarded to lhdr()
  *
  * Returns the offset just past this header (name, extra field and comment
  * included), or 0 when no header is found here or when one of its
  * variable-length parts runs out of the file.
  */
 static unsigned int chdr(fmap_t *map, uint32_t coff, uint32_t zsize, unsigned int *fu, unsigned int fc, int *ret, cli_ctx *ctx, char *tmpd) {
   uint8_t *ch = fmap_need_off(map, coff, SIZEOF_CH);
   char name[256];
   int last = 0;

   if(!ch) {
     cli_dbgmsg("cli_unzip: ch - wrkcomplete\n");
     return 0;
   }
   if(CH_magic != 0x02014b50) {
     fmap_unneed_ptr(map, ch, SIZEOF_CH);
     cli_dbgmsg("cli_unzip: ch - wrkcomplete\n");
     return 0;
   }
   coff += SIZEOF_CH;

   cli_dbgmsg("cli_unzip: ch - flags %x - method %x - csize %x - usize %x - flen %x - elen %x - clen %x - disk %x - off %x\n", CH_flags, CH_method, CH_csize, CH_usize, CH_flen, CH_elen, CH_clen, CH_dsk, CH_off);

   /* file name */
   if(zsize - coff <= CH_flen) {
     cli_dbgmsg("cli_unzip: ch - fname out of file\n");
     last = 1;
   } else if(cli_debug_flag) {
     /* the name is only fetched to be logged */
     unsigned int fnlen = CH_flen;
     char *fname;

     if(fnlen >= sizeof(name))
       fnlen = sizeof(name) - 1;
     fname = fmap_need_off_once(map, coff, fnlen);
     if(fname) {
       memcpy(name, fname, fnlen);
       name[fnlen] = '\0';
       cli_dbgmsg("cli_unzip: ch - fname: %s\n", name);
     }
   }
   coff += CH_flen;

   /* extra field */
   if(!last && zsize - coff <= CH_elen) {
     cli_dbgmsg("cli_unzip: ch - extra out of file\n");
     last = 1;
   }
   coff += CH_elen;

   /* comment */
   if(!last && zsize - coff < CH_clen) {
     cli_dbgmsg("cli_unzip: ch - comment out of file\n");
     last = 1;
   }
   coff += CH_clen;

   /* the local header is processed even when this header is the last one */
   if(CH_off >= zsize - SIZEOF_LH)
     cli_dbgmsg("cli_unzip: ch - local hdr out of file\n");
   else
     lhdr(map, CH_off, zsize-CH_off, fu, fc, ch, ret, ctx, tmpd, 1);

   fmap_unneed_ptr(map, ch, SIZEOF_CH);
   if(last)
     return 0;
   return coff;
 }
 
 
bd7f7684
 /*
  * Scan every member of the zip archive mapped in ctx.
  *
  * The central directory is looked up by searching backwards for the
  * end-of-central-directory signature and then walked entry by entry.
  * When that yields at most a quarter as many unpacked files as entries
  * (or no central directory is found at all), the local headers are walked
  * from the start of the file instead.
  *
  * Returns CL_CLEAN when the file is too big or too short to handle,
  * CL_ETMPDIR when the temporary directory cannot be set up, CL_EMAXFILES
  * when the file limit is hit, and otherwise the last result produced
  * while processing the headers.
  */
 int cli_unzip(cli_ctx *ctx) {
   fmap_t *map = *ctx->fmap;
   unsigned int fc = 0, fu = 0;
   uint32_t fsize, lhoff = 0, coff = 0;
   int ret = CL_CLEAN;
   char *tmpd, *ptr;

   cli_dbgmsg("in cli_unzip\n");
   fsize = (uint32_t)map->len;
   if(sizeof(off_t)!=sizeof(uint32_t) && (off_t)fsize!=map->len) {
     cli_dbgmsg("cli_unzip: file too big\n");
     return CL_CLEAN;
   }
   if(fsize < SIZEOF_CH) {
     cli_dbgmsg("cli_unzip: file too short\n");
     return CL_CLEAN;
   }

   tmpd = cli_gentemp(ctx->engine->tmpdir);
   if(!tmpd)
     return CL_ETMPDIR;
   if(mkdir(tmpd, 0700)) {
     cli_dbgmsg("cli_unzip: Can't create temporary directory %s\n", tmpd);
     free(tmpd);
     return CL_ETMPDIR;
   }

   /* Search backwards for the end-of-central-directory record; coff ends
    * up as the central directory offset, or 0 when none is found. */
   coff = fsize - 22; /* sizeof(EOC)==22 */
   while(coff > 0) {
     ptr = fmap_need_off_once(map, coff, 20);
     if(ptr && cli_readint32(ptr)==0x06054b50) {
       uint32_t chptr = cli_readint32(&ptr[16]);
       if(CLI_ISCONTAINED(0, fsize, chptr, SIZEOF_CH)) {
         coff = chptr;
         break;
       }
     }
     coff--;
   }

   if(!coff) {
     cli_dbgmsg("cli_unzip: central not found, using localhdrs\n");
   } else {
     cli_dbgmsg("cli_unzip: central @%x\n", coff);
     while(ret==CL_CLEAN) {
       coff = chdr(map, coff, fsize, &fu, fc+1, &ret, ctx, tmpd);
       if(!coff)
         break;
       fc++;
       if(ctx->engine->maxfiles && fu>=ctx->engine->maxfiles) {
         cli_dbgmsg("cli_unzip: Files limit reached (max: %u)\n", ctx->engine->maxfiles);
         ret = CL_EMAXFILES;
       }
     }
   }

   if(fu <= (fc/4)) { /* FIXME: make up a sane ratio or remove the whole logic */
     /* too little came out of the central directory: walk local headers */
     fc = 0;
     while(ret==CL_CLEAN && lhoff<fsize) {
       coff = lhdr(map, lhoff, fsize-lhoff, &fu, fc+1, NULL, &ret, ctx, tmpd, 1);
       if(!coff)
         break;
       fc++;
       lhoff += coff;
       if(ctx->engine->maxfiles && fu>=ctx->engine->maxfiles) {
         cli_dbgmsg("cli_unzip: Files limit reached (max: %u)\n", ctx->engine->maxfiles);
         ret = CL_EMAXFILES;
       }
     }
   }

   if(!ctx->engine->keeptmp)
     cli_rmdirs(tmpd);
   free(tmpd);

   return ret;
 }
 
2d5dbc37
 /*
  * Process the single zip member whose local header sits at lhoffl in the
  * file mapped by ctx.
  *
  * ctx    - scan context; the map is taken from *ctx->fmap
  * lhoffl - offset of the local header inside the map
  *
  * The member is handed to lhdr() without a central header, without a
  * temporary directory and with encrypted-member detection turned off.
  *
  * Returns CL_CLEAN when the offset is unusable or too little data follows
  * it, otherwise whatever lhdr() stored as the scan result.
  */
 int cli_unzip_single(cli_ctx *ctx, off_t lhoffl) {
   int ret=CL_CLEAN;
   unsigned int fu=0;
   uint32_t fsize;
   fmap_t *map = *ctx->fmap;

   cli_dbgmsg("in cli_unzip_single\n");
   fsize = (uint32_t)(map->len - lhoffl);
   /* lhdr() takes both the offset and the remaining size as uint32_t, so
    * refuse anything that would be truncated by those conversions */
   if (lhoffl<0 || lhoffl>map->len ||
       (sizeof(off_t)!=sizeof(uint32_t) &&
        ((off_t)fsize!=map->len - lhoffl || (off_t)(uint32_t)lhoffl!=lhoffl))) {
     cli_dbgmsg("cli_unzip: bad offset\n");
     return CL_CLEAN;
   }
   if (fsize < SIZEOF_LH) {
     cli_dbgmsg("cli_unzip: file too short\n");
     return CL_CLEAN;
   }

   lhdr(map, lhoffl, fsize, &fu, 0, NULL, &ret, ctx, NULL, 0);

   return ret;
 }