libclamav/vba_extract.c
47bbbc56
 /*
f893c0f3
  *  Extract VBA source code for component MS Office Documents
47bbbc56
  *
e1cbc270
  *  Copyright (C) 2013-2019 Cisco Systems, Inc. and/or its affiliates. All rights reserved.
80649b28
  *  Copyright (C) 2007-2013 Sourcefire, Inc.
2023340a
  *
  *  Authors: Trog, Nigel Horne
fa53d800
  *
47bbbc56
  *  This program is free software; you can redistribute it and/or modify
2023340a
  *  it under the terms of the GNU General Public License version 2 as
  *  published by the Free Software Foundation.
47bbbc56
  *
  *  This program is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  *
  *  You should have received a copy of the GNU General Public License
  *  along with this program; if not, write to the Free Software
48b7b4a7
  *  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
  *  MA 02110-1301, USA.
47bbbc56
  */
2023340a
 
fa53d800
 #if HAVE_CONFIG_H
 #include "clamav-config.h"
 #endif
47bbbc56
 
 #include <stdio.h>
 #include <string.h>
288057e9
 #ifdef HAVE_UNISTD_H
47bbbc56
 #include <unistd.h>
b58fdfc2
 #endif
47bbbc56
 #include <fcntl.h>
 #include <stdlib.h>
 #include <ctype.h>
5f02033a
 #include <zlib.h>
 
 #include "clamav.h"
47bbbc56
 
ca90717f
 #include "others.h"
72ce4b70
 #include "scanners.h"
9fe789f8
 #include "vba_extract.h"
288057e9
 #ifdef CL_DEBUG
c0195d1f
 #include "mbox.h"
 #endif
fa53d800
 #include "blob.h"
09dddc5b
 #ifdef HAVE_JSON
e182c02c
 #include "json.h"
09dddc5b
 #endif
47bbbc56
 
9294cf21
 #define PPT_LZW_BUFFSIZE 8192
 #define VBA_COMPRESSION_WINDOW 4096
288057e9
 #define MIDDLE_SIZE 20
 #define MAX_VBA_COUNT 1000 /* If there's more than 1000 macros something's up! */
9294cf21
 
9fe789f8
 #ifndef HAVE_ATTRIB_PACKED
 #define __attribute__(x)
ffd168d4
 #endif
 
9fe789f8
 /*
  * VBA (Visual Basic for Applications), versions 5 and 6
  */
ffd168d4
 struct vba56_header {
288057e9
     unsigned char magic[2];
     unsigned char version[4];
     unsigned char ignore[28];
ffd168d4
 };
 
9fe789f8
 typedef struct {
288057e9
     uint32_t sig;
     const char *ver;
     int big_endian; /* e.g. MAC Office */
47bbbc56
 } vba_version_t;
 
288057e9
 static int skip_past_nul(int fd);
 static int read_uint16(int fd, uint16_t *u, int big_endian);
 static int read_uint32(int fd, uint32_t *u, int big_endian);
 static int seekandread(int fd, off_t offset, int whence, void *data, size_t len);
 static vba_project_t *create_vba_project(int record_count, const char *dir, struct uniq *U);
9fe789f8
 
e19ed67b
 static uint16_t
 vba_endian_convert_16(uint16_t value, int big_endian)
31c42eb7
 {
288057e9
     if (big_endian)
         return (uint16_t)be16_to_host(value);
     else
         return le16_to_host(value);
337cb206
 }
fa53d800
 
9fe789f8
 /* Seems to be a duplicate of riff_endian_convert_32() */
e19ed67b
 static uint32_t
 vba_endian_convert_32(uint32_t value, int big_endian)
31c42eb7
 {
288057e9
     if (big_endian)
         return be32_to_host(value);
     else
         return le32_to_host(value);
31c42eb7
 }
337cb206
 
fa53d800
 static char *
16975455
 get_unicode_name(const char *name, int size, int big_endian)
47bbbc56
 {
288057e9
     int i, increment;
     char *newname, *ret;
25ba8c63
 
288057e9
     if ((name == NULL) || (*name == '\0') || (size <= 0))
         return NULL;
25ba8c63
 
288057e9
     newname = (char *)cli_malloc(size * 7 + 1);
     if (newname == NULL) {
241e7eb1
         cli_errmsg("get_unicode_name: Unable to allocate memory for newname\n");
288057e9
         return NULL;
241e7eb1
     }
69380565
 
288057e9
     if ((!big_endian) && (size & 0x1)) {
         cli_dbgmsg("get_unicode_name: odd number of bytes %d\n", size);
         --size;
     }
349e0502
 
288057e9
     increment = (big_endian) ? 1 : 2;
     ret       = newname;
 
     for (i = 0; i < size; i += increment) {
         if ((!(name[i] & 0x80)) && isprint(name[i])) {
             *ret++ = tolower(name[i]);
         } else {
             if ((name[i] < 10) && (name[i] >= 0)) {
                 *ret++ = '_';
                 *ret++ = (char)(name[i] + '0');
             } else {
                 uint16_t x;
                 if ((i + 1) >= size)
                     break;
eb1ccdea
                 x = (uint16_t)((name[i] < 0 ? 0 : name[i] << 8) | name[i + 1]);
288057e9
 
                 *ret++ = '_';
                 *ret++ = (char)('a' + ((x & 0xF)));
                 *ret++ = (char)('a' + ((x >> 4) & 0xF));
                 *ret++ = (char)('a' + ((x >> 8) & 0xF));
                 *ret++ = 'a';
                 *ret++ = 'a';
             }
             *ret++ = '_';
         }
     }
 
     *ret = '\0';
 
     /* Saves a lot of memory */
     ret = cli_realloc(newname, (ret - newname) + 1);
     return ret ? ret : newname;
 }
9fe789f8
 
349e0502
 static void vba56_test_middle(int fd)
 {
288057e9
     char test_middle[MIDDLE_SIZE];
 
     /* MacOffice middle */
     static const uint8_t middle1_str[MIDDLE_SIZE] = {
         0x00, 0x01, 0x0d, 0x45, 0x2e, 0xe1, 0xe0, 0x8f, 0x10, 0x1a,
         0x85, 0x2e, 0x02, 0x60, 0x8c, 0x4d, 0x0b, 0xb4, 0x00, 0x00};
     /* MS Office middle */
     static const uint8_t middle2_str[MIDDLE_SIZE] = {
         0x00, 0x00, 0xe1, 0x2e, 0x45, 0x0d, 0x8f, 0xe0, 0x1a, 0x10,
         0x85, 0x2e, 0x02, 0x60, 0x8c, 0x4d, 0x0b, 0xb4, 0x00, 0x00};
 
     if (cli_readn(fd, &test_middle, MIDDLE_SIZE) != MIDDLE_SIZE)
         return;
 
     if ((memcmp(test_middle, middle1_str, MIDDLE_SIZE) != 0) &&
         (memcmp(test_middle, middle2_str, MIDDLE_SIZE) != 0)) {
         cli_dbgmsg("middle not found\n");
         if (lseek(fd, -MIDDLE_SIZE, SEEK_CUR) == -1) {
7e40bab9
             cli_dbgmsg("vba_test_middle: call to lseek() failed\n");
             return;
         }
288057e9
     } else
         cli_dbgmsg("middle found\n");
349e0502
 }
 
dc312134
 /* return count of valid strings found, 0 on error */
ac8154d9
 static int
16975455
 vba_read_project_strings(int fd, int big_endian)
dc890a72
 {
80649b28
     unsigned char *buf = NULL;
288057e9
     uint16_t buflen    = 0;
     uint16_t length    = 0;
8c66e386
     int ret = 0, getnewlength = 1;
d489ba80
 
288057e9
     for (;;) {
80649b28
         off_t offset;
         char *name;
d92098c8
 
8c66e386
         /* if no initial name length, exit */
288057e9
         if (getnewlength && !read_uint16(fd, &length, big_endian)) {
dc312134
             ret = 0;
             break;
         }
8c66e386
         getnewlength = 0;
 
d489ba80
         /* if too short, break */
80649b28
         if (length < 6) {
             if (lseek(fd, -2, SEEK_CUR) == -1) {
7e40bab9
                 cli_dbgmsg("vba_read_project_strings: call to lseek() has failed\n");
d489ba80
                 ret = 0;
7e40bab9
             }
80649b28
             break;
         }
d489ba80
         /* ensure buffer is large enough */
288057e9
         if (length > buflen) {
80649b28
             unsigned char *newbuf = (unsigned char *)cli_realloc(buf, length);
288057e9
             if (newbuf == NULL) {
d489ba80
                 ret = 0;
                 break;
80649b28
             }
             buflen = length;
288057e9
             buf    = newbuf;
80649b28
         }
9fe789f8
 
d489ba80
         /* save current offset */
80649b28
         offset = lseek(fd, 0, SEEK_CUR);
7e40bab9
         if (offset == -1) {
             cli_dbgmsg("vba_read_project_strings: call to lseek() has failed\n");
d489ba80
             ret = 0;
             break;
7e40bab9
         }
ffd168d4
 
d489ba80
         /* if read name failed, break */
6c03dc5d
         if (cli_readn(fd, buf, (size_t)length) != (size_t)length) {
80649b28
             cli_dbgmsg("read name failed - rewinding\n");
             if (lseek(fd, offset, SEEK_SET) == -1) {
7e40bab9
                 cli_dbgmsg("call to lseek() in read name failed\n");
d489ba80
                 ret = 0;
7e40bab9
             }
80649b28
             break;
         }
         name = get_unicode_name((const char *)buf, length, big_endian);
         cli_dbgmsg("length: %d, name: %s\n", length, (name) ? name : "[null]");
dc890a72
 
d489ba80
         /* if invalid name, break */
288057e9
         if ((name == NULL) || (memcmp("*\\", name, 2) != 0) ||
             (strchr("ghcd", name[2]) == NULL)) {
d489ba80
             /* Not a valid string, rewind */
288057e9
             if (lseek(fd, -(length + 2), SEEK_CUR) == -1) {
7e40bab9
                 cli_dbgmsg("call to lseek() after get_unicode_name has failed\n");
d489ba80
                 ret = 0;
7e40bab9
             }
80649b28
             free(name);
             break;
         }
         free(name);
ac8154d9
 
d489ba80
         /* can't get length, break */
288057e9
         if (!read_uint16(fd, &length, big_endian)) {
80649b28
             break;
         }
ac8154d9
 
80649b28
         ret++;
72ce4b70
 
d489ba80
         /* continue on reasonable length value */
80649b28
         if ((length != 0) && (length != 65535)) {
             continue;
         }
d489ba80
 
         /* determine offset and run middle test */
80649b28
         offset = lseek(fd, 10, SEEK_CUR);
7e40bab9
         if (offset == -1) {
             cli_dbgmsg("call to lseek() has failed\n");
d489ba80
             ret = 0;
             break;
7e40bab9
         }
80649b28
         cli_dbgmsg("offset: %lu\n", (unsigned long)offset);
         vba56_test_middle(fd);
8c66e386
         getnewlength = 1;
80649b28
     }
d489ba80
 
80649b28
     free(buf);
     return ret;
dc890a72
 }
349e0502
 
11d24f8a
 vba_project_t *
72ce4b70
 cli_vba_readdir(const char *dir, struct uniq *U, uint32_t which)
47bbbc56
 {
288057e9
     unsigned char *buf;
     const unsigned char vba56_signature[] = {0xcc, 0x61};
     uint16_t record_count, buflen, ffff, byte_count;
     uint32_t offset;
     int i, j, fd, big_endian = FALSE;
     vba_project_t *vba_project;
     struct vba56_header v56h;
     off_t seekback;
     char fullname[1024], *hash;
49df8ea7
     uint32_t hashcnt = 0;
288057e9
 
     cli_dbgmsg("in cli_vba_readdir()\n");
 
     if (dir == NULL)
         return NULL;
 
     /*
9fe789f8
 	 * _VBA_PROJECT files are embedded within office documents (OLE2)
 	 */
288057e9
 
49df8ea7
     if (CL_SUCCESS != uniq_get(U, "_vba_project", 12, &hash, &hashcnt)) {
         cli_dbgmsg("vba_readdir: uniq_get('_vba_project') failed. Unable to check # of embedded vba proj files\n");
288057e9
         return NULL;
49df8ea7
     }
     if (hashcnt == 0) {
         return NULL;
     }
288057e9
     snprintf(fullname, sizeof(fullname), "%s" PATHSEP "%s_%u", dir, hash, which);
     fullname[sizeof(fullname) - 1] = '\0';
     fd                             = open(fullname, O_RDONLY | O_BINARY);
 
     if (fd == -1)
         return NULL;
 
     if (cli_readn(fd, &v56h, sizeof(struct vba56_header)) != sizeof(struct vba56_header)) {
         close(fd);
         return NULL;
     }
     if (memcmp(v56h.magic, vba56_signature, sizeof(v56h.magic)) != 0) {
         close(fd);
         return NULL;
     }
 
     i = vba_read_project_strings(fd, TRUE);
     if ((seekback = lseek(fd, 0, SEEK_CUR)) == -1) {
         cli_dbgmsg("vba_readdir: lseek() failed. Unable to guess VBA type\n");
         close(fd);
         return NULL;
     }
     if (lseek(fd, sizeof(struct vba56_header), SEEK_SET) == -1) {
         cli_dbgmsg("vba_readdir: lseek() failed. Unable to guess VBA type\n");
         close(fd);
         return NULL;
     }
     j = vba_read_project_strings(fd, FALSE);
     if (!i && !j) {
         close(fd);
         cli_dbgmsg("vba_readdir: Unable to guess VBA type\n");
         return NULL;
     }
     if (i > j) {
         big_endian = TRUE;
         if (lseek(fd, seekback, SEEK_SET) == -1) {
             cli_dbgmsg("vba_readdir: call to lseek() while guessing big-endian has failed\n");
             close(fd);
             return NULL;
         }
         cli_dbgmsg("vba_readdir: Guessing big-endian\n");
     } else {
         cli_dbgmsg("vba_readdir: Guessing little-endian\n");
     }
 
     /* junk some more stuff */
     do
         if (cli_readn(fd, &ffff, 2) != 2) {
             close(fd);
             return NULL;
         }
     while (ffff != 0xFFFF);
 
     /* check for alignment error */
     if (!seekandread(fd, -3, SEEK_CUR, &ffff, sizeof(uint16_t))) {
         close(fd);
         return NULL;
     }
     if (ffff != 0xFFFF) {
         if (lseek(fd, 1, SEEK_CUR) == -1) {
7e40bab9
             cli_dbgmsg("call to lseek() while checking alignment error has failed\n");
             close(fd);
             return NULL;
         }
     }
fa53d800
 
288057e9
     if (!read_uint16(fd, &ffff, big_endian)) {
         close(fd);
         return NULL;
     }
47bbbc56
 
288057e9
     if (ffff != 0xFFFF) {
         if (lseek(fd, ffff, SEEK_CUR) == -1) {
7e40bab9
             cli_dbgmsg("call to lseek() while checking alignment error has failed\n");
             close(fd);
             return NULL;
         }
     }
9fe789f8
 
288057e9
     if (!read_uint16(fd, &ffff, big_endian)) {
         close(fd);
         return NULL;
     }
47bbbc56
 
288057e9
     if (ffff == 0xFFFF)
         ffff = 0;
9fe789f8
 
288057e9
     if (lseek(fd, ffff + 100, SEEK_CUR) == -1) {
7e40bab9
         cli_dbgmsg("call to lseek() failed\n");
         close(fd);
         return NULL;
     }
9fe789f8
 
288057e9
     if (!read_uint16(fd, &record_count, big_endian)) {
         close(fd);
         return NULL;
     }
     cli_dbgmsg("vba_readdir: VBA Record count %d\n", record_count);
     if (record_count == 0) {
         /* No macros, assume clean */
         close(fd);
         return NULL;
     }
     if (record_count > MAX_VBA_COUNT) {
         /* Almost certainly an error */
         cli_dbgmsg("vba_readdir: VBA Record count too big\n");
         close(fd);
         return NULL;
     }
 
     vba_project = create_vba_project(record_count, dir, U);
     if (vba_project == NULL) {
         close(fd);
         return NULL;
     }
     buf    = NULL;
     buflen = 0;
     for (i = 0; i < record_count; i++) {
         uint16_t length;
         char *ptr;
 
         vba_project->colls[i] = 0;
         if (!read_uint16(fd, &length, big_endian))
             break;
 
         if (length == 0) {
             cli_dbgmsg("vba_readdir: zero name length\n");
             break;
         }
         if (length > buflen) {
             unsigned char *newbuf = (unsigned char *)cli_realloc(buf, length);
             if (newbuf == NULL)
                 break;
             buflen = length;
             buf    = newbuf;
         }
6c03dc5d
         if (cli_readn(fd, buf, (size_t)length) != (size_t)length) {
288057e9
             cli_dbgmsg("vba_readdir: read name failed\n");
             break;
         }
         ptr = get_unicode_name((const char *)buf, length, big_endian);
         if (ptr == NULL) break;
49df8ea7
         if (CL_SUCCESS != uniq_get(U, ptr, strlen(ptr), &hash, &hashcnt)) {
             cli_dbgmsg("vba_readdir: uniq_get('%s') failed.\n", ptr);
             free(ptr);
             break;
         }
         vba_project->colls[i] = hashcnt;
         if (0 == vba_project->colls[i]) {
288057e9
             cli_dbgmsg("vba_readdir: cannot find project %s (%s)\n", ptr, hash);
             free(ptr);
             break;
         }
         cli_dbgmsg("vba_readdir: project name: %s (%s)\n", ptr, hash);
         free(ptr);
         vba_project->name[i] = hash;
         if (!read_uint16(fd, &length, big_endian))
             break;
         lseek(fd, length, SEEK_CUR);
 
         if (!read_uint16(fd, &ffff, big_endian))
             break;
         if (ffff == 0xFFFF) {
             lseek(fd, 2, SEEK_CUR);
             if (!read_uint16(fd, &ffff, big_endian))
                 break;
             lseek(fd, ffff + 8, SEEK_CUR);
         } else
             lseek(fd, ffff + 10, SEEK_CUR);
 
         if (!read_uint16(fd, &byte_count, big_endian))
             break;
         lseek(fd, (8 * byte_count) + 5, SEEK_CUR);
         if (!read_uint32(fd, &offset, big_endian))
             break;
         cli_dbgmsg("vba_readdir: offset: %u\n", (unsigned int)offset);
         vba_project->offset[i] = offset;
         lseek(fd, 2, SEEK_CUR);
     }
 
     if (buf)
         free(buf);
 
     close(fd);
 
     if (i < record_count) {
         free(vba_project->name);
         free(vba_project->colls);
         free(vba_project->dir);
         free(vba_project->offset);
         free(vba_project);
         return NULL;
     }
 
     return vba_project;
47bbbc56
 }
 
faa0d267
 unsigned char *
6c03dc5d
 cli_vba_inflate(int fd, off_t offset, size_t *size)
47bbbc56
 {
288057e9
     unsigned int pos, shift, mask, distance, clean;
     uint8_t flag;
     uint16_t token;
     blob *b;
     unsigned char buffer[VBA_COMPRESSION_WINDOW];
 
     if (fd < 0)
         return NULL;
 
     b = blobCreate();
 
     if (b == NULL)
         return NULL;
 
     memset(buffer, 0, sizeof(buffer));
     lseek(fd, offset + 3, SEEK_SET); /* 1byte ?? , 2byte length ?? */
     clean = TRUE;
     pos   = 0;
 
     while (cli_readn(fd, &flag, 1) == 1) {
         for (mask = 1; mask < 0x100; mask <<= 1) {
             unsigned int winpos = pos % VBA_COMPRESSION_WINDOW;
             if (flag & mask) {
                 uint16_t len;
                 unsigned int srcpos;
 
                 if (!read_uint16(fd, &token, FALSE)) {
                     blobDestroy(b);
                     if (size)
                         *size = 0;
                     return NULL;
                 }
                 shift    = 12 - (winpos > 0x10) - (winpos > 0x20) - (winpos > 0x40) - (winpos > 0x80) - (winpos > 0x100) - (winpos > 0x200) - (winpos > 0x400) - (winpos > 0x800);
                 len      = (uint16_t)((token & ((1 << shift) - 1)) + 3);
                 distance = token >> shift;
 
                 srcpos = pos - distance - 1;
                 if ((((srcpos + len) % VBA_COMPRESSION_WINDOW) < winpos) &&
                     ((winpos + len) < VBA_COMPRESSION_WINDOW) &&
                     (((srcpos % VBA_COMPRESSION_WINDOW) + len) < VBA_COMPRESSION_WINDOW) &&
                     (len <= VBA_COMPRESSION_WINDOW)) {
                     srcpos %= VBA_COMPRESSION_WINDOW;
                     memcpy(&buffer[winpos], &buffer[srcpos],
                            len);
                     pos += len;
                 } else
                     while (len-- > 0) {
                         srcpos                                 = (pos - distance - 1) % VBA_COMPRESSION_WINDOW;
                         buffer[pos++ % VBA_COMPRESSION_WINDOW] = buffer[srcpos];
                     }
             } else {
                 if ((pos != 0) && (winpos == 0) && clean) {
                     if (cli_readn(fd, &token, 2) != 2) {
                         blobDestroy(b);
                         if (size)
                             *size = 0;
                         return NULL;
                     }
                     (void)blobAddData(b, buffer, VBA_COMPRESSION_WINDOW);
                     clean = FALSE;
                     break;
                 }
                 if (cli_readn(fd, &buffer[winpos], 1) == 1)
                     pos++;
             }
             clean = TRUE;
         }
     }
 
     if (blobAddData(b, buffer, pos % VBA_COMPRESSION_WINDOW) < 0) {
         blobDestroy(b);
         if (size)
             *size = 0;
         return NULL;
     }
 
     if (size)
6c03dc5d
         *size = blobGetDataSize(b);
288057e9
     return (unsigned char *)blobToMem(b);
47bbbc56
 }
7b9aed8c
 
9fe789f8
 /*
  * See also cli_filecopy()
  */
 static void
 ole_copy_file_data(int s, int d, uint32_t len)
892d2f56
 {
288057e9
     unsigned char data[FILEBUFF];
9fe789f8
 
288057e9
     while (len > 0) {
6c03dc5d
         size_t todo = MIN(sizeof(data), len);
9fe789f8
 
6c03dc5d
         if (cli_readn(s, data, todo) != todo)
288057e9
             break;
6c03dc5d
         if (cli_writen(d, data, todo) != todo)
288057e9
             break;
6c03dc5d
 
         if (todo > len) {
             break;
         } else {
             len -= todo;
         }
288057e9
     }
892d2f56
 }
 
288057e9
 int cli_scan_ole10(int fd, cli_ctx *ctx)
892d2f56
 {
288057e9
     int ofd, ret;
     uint32_t object_size;
     STATBUF statbuf;
     char *fullname;
 
     if (fd < 0)
         return CL_CLEAN;
 
     lseek(fd, 0, SEEK_SET);
     if (!read_uint32(fd, &object_size, FALSE))
         return CL_CLEAN;
 
     if (FSTAT(fd, &statbuf) == -1)
         return CL_ESTAT;
 
     if ((statbuf.st_size - object_size) >= 4) {
         /* Probably the OLE type id */
         if (lseek(fd, 2, SEEK_CUR) == -1) {
             return CL_CLEAN;
         }
 
         /* Attachment name */
         if (!skip_past_nul(fd))
             return CL_CLEAN;
 
         /* Attachment full path */
         if (!skip_past_nul(fd))
             return CL_CLEAN;
 
         /* ??? */
         if (lseek(fd, 8, SEEK_CUR) == -1)
             return CL_CLEAN;
 
         /* Attachment full path */
         if (!skip_past_nul(fd))
             return CL_CLEAN;
 
         if (!read_uint32(fd, &object_size, FALSE))
             return CL_CLEAN;
     }
     if (!(fullname = cli_gentemp(ctx ? ctx->engine->tmpdir : NULL))) {
         return CL_EMEM;
     }
     ofd = open(fullname, O_RDWR | O_CREAT | O_TRUNC | O_BINARY | O_EXCL,
                S_IWUSR | S_IRUSR);
     if (ofd < 0) {
         cli_warnmsg("cli_decode_ole_object: can't create %s\n", fullname);
         free(fullname);
         return CL_ECREAT;
     }
     cli_dbgmsg("cli_decode_ole_object: decoding to %s\n", fullname);
     ole_copy_file_data(fd, ofd, object_size);
     lseek(ofd, 0, SEEK_SET);
     ret = cli_magic_scandesc(ofd, fullname, ctx);
     close(ofd);
     if (ctx && !ctx->engine->keeptmp)
         if (cli_unlink(fullname))
             ret = CL_EUNLINK;
     free(fullname);
     return ret;
892d2f56
 }
 
9fe789f8
 /*
  * Powerpoint files
  */
 typedef struct {
288057e9
     uint16_t type;
     uint32_t length;
5f02033a
 } atom_header_t;
 
9fe789f8
 static int
 ppt_read_atom_header(int fd, atom_header_t *atom_header)
5f02033a
 {
288057e9
     uint16_t v;
     struct ppt_header {
         uint16_t ver;
         uint16_t type;
         uint32_t length;
     } h;
 
     cli_dbgmsg("in ppt_read_atom_header\n");
     if (cli_readn(fd, &h, sizeof(struct ppt_header)) != sizeof(struct ppt_header)) {
         cli_dbgmsg("read ppt_header failed\n");
         return FALSE;
     }
     v = vba_endian_convert_16(h.ver, FALSE);
     cli_dbgmsg("\tversion: 0x%.2x\n", v & 0xF);
     cli_dbgmsg("\tinstance: 0x%.2x\n", v >> 4);
 
     atom_header->type = vba_endian_convert_16(h.type, FALSE);
     cli_dbgmsg("\ttype: 0x%.4x\n", atom_header->type);
     atom_header->length = vba_endian_convert_32(h.length, FALSE);
     cli_dbgmsg("\tlength: 0x%.8x\n", (int)atom_header->length);
 
     return TRUE;
5f02033a
 }
 
9fe789f8
 /*
16975455
  * TODO: combine shared code with flatedecode() or cli_unzip_single()
  *	Needs cli_unzip_single to have a "length" argument
9fe789f8
  */
16975455
 static int
 ppt_unlzw(const char *dir, int fd, uint32_t length)
5f02033a
 {
288057e9
     int ofd;
     z_stream stream;
     unsigned char inbuff[PPT_LZW_BUFFSIZE], outbuff[PPT_LZW_BUFFSIZE];
     char fullname[NAME_MAX + 1];
 
     snprintf(fullname, sizeof(fullname) - 1, "%s" PATHSEP "ppt%.8lx.doc",
              dir, (long)lseek(fd, 0L, SEEK_CUR));
 
     ofd = open(fullname, O_WRONLY | O_CREAT | O_TRUNC | O_BINARY | O_EXCL,
                S_IWUSR | S_IRUSR);
     if (ofd == -1) {
         cli_warnmsg("ppt_unlzw: can't create %s\n", fullname);
         return FALSE;
     }
 
     stream.zalloc    = Z_NULL;
     stream.zfree     = Z_NULL;
     stream.opaque    = (void *)NULL;
     stream.next_in   = (Bytef *)inbuff;
     stream.next_out  = outbuff;
     stream.avail_out = sizeof(outbuff);
     stream.avail_in  = MIN(length, PPT_LZW_BUFFSIZE);
 
6c03dc5d
     if (cli_readn(fd, inbuff, (size_t)stream.avail_in) != (size_t)stream.avail_in) {
288057e9
         close(ofd);
         cli_unlink(fullname);
         return FALSE;
     }
     length -= stream.avail_in;
 
     if (inflateInit(&stream) != Z_OK) {
         close(ofd);
         cli_unlink(fullname);
         cli_warnmsg("ppt_unlzw: inflateInit failed\n");
         return FALSE;
     }
 
     do {
         if (stream.avail_out == 0) {
             if (cli_writen(ofd, outbuff, PPT_LZW_BUFFSIZE) != PPT_LZW_BUFFSIZE) {
                 close(ofd);
                 inflateEnd(&stream);
                 return FALSE;
             }
             stream.next_out  = outbuff;
             stream.avail_out = PPT_LZW_BUFFSIZE;
         }
         if (stream.avail_in == 0) {
             stream.next_in  = inbuff;
             stream.avail_in = MIN(length, PPT_LZW_BUFFSIZE);
6c03dc5d
             if (cli_readn(fd, inbuff, (size_t)stream.avail_in) != (size_t)stream.avail_in) {
288057e9
                 close(ofd);
                 inflateEnd(&stream);
                 return FALSE;
             }
             length -= stream.avail_in;
         }
     } while (inflate(&stream, Z_NO_FLUSH) == Z_OK);
 
6c03dc5d
     if (cli_writen(ofd, outbuff, PPT_LZW_BUFFSIZE - stream.avail_out) != (size_t)(PPT_LZW_BUFFSIZE - stream.avail_out)) {
288057e9
         close(ofd);
         inflateEnd(&stream);
         return FALSE;
     }
     close(ofd);
     return inflateEnd(&stream) == Z_OK;
5f02033a
 }
 
9fe789f8
 static const char *
 ppt_stream_iter(int fd, const char *dir)
42034091
 {
288057e9
     atom_header_t atom_header;
 
     while (ppt_read_atom_header(fd, &atom_header)) {
         if (atom_header.length == 0)
             return NULL;
 
         if (atom_header.type == 0x1011) {
             uint32_t length;
 
             /* Skip over ID */
             if (lseek(fd, sizeof(uint32_t), SEEK_CUR) == -1) {
                 cli_dbgmsg("ppt_stream_iter: seek failed\n");
                 return NULL;
             }
             length = atom_header.length - 4;
             cli_dbgmsg("length: %d\n", (int)length);
             if (!ppt_unlzw(dir, fd, length)) {
                 cli_dbgmsg("ppt_unlzw failed\n");
                 return NULL;
             }
         } else {
             off_t offset = lseek(fd, 0, SEEK_CUR);
             /* Check we don't wrap */
             if ((offset + (off_t)atom_header.length) < offset) {
                 break;
             }
             offset += atom_header.length;
             if (lseek(fd, offset, SEEK_SET) != offset) {
                 break;
             }
         }
     }
     return dir;
42034091
 }
 
9fe789f8
 char *
33068e09
 cli_ppt_vba_read(int ifd, cli_ctx *ctx)
5f02033a
 {
288057e9
     char *dir;
     const char *ret;
 
     /* Create a directory to store the extracted OLE2 objects */
     dir = cli_gentemp(ctx ? ctx->engine->tmpdir : NULL);
     if (dir == NULL)
         return NULL;
     if (mkdir(dir, 0700)) {
         cli_errmsg("cli_ppt_vba_read: Can't create temporary directory %s\n", dir);
         free(dir);
         return NULL;
     }
     ret = ppt_stream_iter(ifd, dir);
     if (ret == NULL) {
         cli_rmdirs(dir);
         free(dir);
         return NULL;
     }
     return dir;
42034091
 }
 
9fe789f8
 /*
  * Word 6 macros
  */
 typedef struct {
288057e9
     unsigned char unused[12];
     uint32_t macro_offset;
     uint32_t macro_len;
7b9aed8c
 } mso_fib_t;
 
 typedef struct macro_entry_tag {
288057e9
     uint32_t len;
     uint32_t offset;
     unsigned char key;
7b9aed8c
 } macro_entry_t;
 
 typedef struct macro_info_tag {
288057e9
     struct macro_entry_tag *entries;
     uint16_t count;
7b9aed8c
 } macro_info_t;
 
9fe789f8
 static int
 word_read_fib(int fd, mso_fib_t *fib)
7b9aed8c
 {
288057e9
     struct {
         uint32_t offset;
         uint32_t len;
     } macro_details;
 
     if (!seekandread(fd, 0x118, SEEK_SET, &macro_details, sizeof(macro_details))) {
         cli_dbgmsg("read word_fib failed\n");
         return FALSE;
     }
     fib->macro_offset = vba_endian_convert_32(macro_details.offset, FALSE);
     fib->macro_len    = vba_endian_convert_32(macro_details.len, FALSE);
 
     return TRUE;
7b9aed8c
 }
 
9fe789f8
 static int
 word_read_macro_entry(int fd, macro_info_t *macro_info)
7b9aed8c
 {
6c03dc5d
     size_t msize;
     uint16_t count = macro_info->count;
288057e9
     macro_entry_t *macro_entry;
9fe789f8
 #ifdef HAVE_PRAGMA_PACK
 #pragma pack(1)
 #endif
 
 #ifdef HAVE_PRAGMA_PACK_HPPA
 #pragma pack 1
 #endif
288057e9
     struct macro {
         unsigned char version;
         unsigned char key;
         unsigned char ignore[10];
         uint32_t len __attribute__((packed));
         uint32_t state __attribute__((packed));
         uint32_t offset __attribute__((packed));
     } * m;
     const struct macro *n;
9fe789f8
 #ifdef HAVE_PRAGMA_PACK
 #pragma pack()
 #endif
 
 #ifdef HAVE_PRAGMA_PACK_HPPA
 #pragma pack
 #endif
288057e9
     if (count == 0)
         return TRUE;
9fe789f8
 
288057e9
     msize = count * sizeof(struct macro);
     m     = cli_malloc(msize);
     if (m == NULL) {
241e7eb1
         cli_errmsg("word_read_macro_entry: Unable to allocate memory for 'm'\n");
288057e9
         return FALSE;
241e7eb1
     }
9fe789f8
 
288057e9
     if (cli_readn(fd, m, msize) != msize) {
         free(m);
6c03dc5d
         cli_warnmsg("read %u macro_entries failed\n", count);
288057e9
         return FALSE;
     }
     macro_entry = macro_info->entries;
     n           = m;
     do {
         macro_entry->key    = n->key;
         macro_entry->len    = vba_endian_convert_32(n->len, FALSE);
         macro_entry->offset = vba_endian_convert_32(n->offset, FALSE);
         macro_entry++;
         n++;
     } while (--count > 0);
     free(m);
     return TRUE;
7b9aed8c
 }
 
9fe789f8
 static macro_info_t *
 word_read_macro_info(int fd, macro_info_t *macro_info)
7b9aed8c
 {
288057e9
     if (!read_uint16(fd, &macro_info->count, FALSE)) {
         cli_dbgmsg("read macro_info failed\n");
         macro_info->count = 0;
         return NULL;
     }
     cli_dbgmsg("macro count: %d\n", macro_info->count);
     if (macro_info->count == 0)
         return NULL;
     macro_info->entries = (macro_entry_t *)cli_malloc(sizeof(macro_entry_t) * macro_info->count);
     if (macro_info->entries == NULL) {
         macro_info->count = 0;
241e7eb1
         cli_errmsg("word_read_macro_info: Unable to allocate memory for macro_info->entries\n");
288057e9
         return NULL;
     }
     if (!word_read_macro_entry(fd, macro_info)) {
         free(macro_info->entries);
         macro_info->count = 0;
         return NULL;
     }
     return macro_info;
7b9aed8c
 }
 
9fe789f8
 static int
 word_skip_oxo3(int fd)
7b9aed8c
 {
288057e9
     uint8_t count;
 
     if (cli_readn(fd, &count, 1) != 1) {
         cli_dbgmsg("read oxo3 record1 failed\n");
         return FALSE;
     }
     cli_dbgmsg("oxo3 records1: %d\n", count);
 
     if (!seekandread(fd, count * 14, SEEK_CUR, &count, 1)) {
         cli_dbgmsg("read oxo3 record2 failed\n");
         return FALSE;
     }
 
     if (count == 0) {
         uint8_t twobytes[2];
 
         if (cli_readn(fd, twobytes, 2) != 2) {
             cli_dbgmsg("read oxo3 failed\n");
             return FALSE;
         }
         if (twobytes[0] != 2) {
             lseek(fd, -2, SEEK_CUR);
             return TRUE;
         }
         count = twobytes[1];
     }
     if (count > 0)
         if (lseek(fd, (count * 4) + 1, SEEK_CUR) == -1) {
             cli_dbgmsg("lseek oxo3 failed\n");
             return FALSE;
         }
 
     cli_dbgmsg("oxo3 records2: %d\n", count);
     return TRUE;
7b9aed8c
 }
 
ac8154d9
 static int
9fe789f8
 word_skip_menu_info(int fd)
7b9aed8c
 {
288057e9
     uint16_t count;
 
     if (!read_uint16(fd, &count, FALSE)) {
         cli_dbgmsg("read menu_info failed\n");
         return FALSE;
     }
     cli_dbgmsg("menu_info count: %d\n", count);
 
     if (count)
         if (lseek(fd, count * 12, SEEK_CUR) == -1)
             return FALSE;
     return TRUE;
7b9aed8c
 }
 
a27be3c7
 static int
9fe789f8
 word_skip_macro_extnames(int fd)
7b9aed8c
 {
288057e9
     int is_unicode, nbytes;
     int16_t size;
 
     if (!read_uint16(fd, (uint16_t *)&size, FALSE)) {
         cli_dbgmsg("read macro_extnames failed\n");
         return FALSE;
     }
     if (size == -1) { /* Unicode flag */
         if (!read_uint16(fd, (uint16_t *)&size, FALSE)) {
             cli_dbgmsg("read macro_extnames failed\n");
             return FALSE;
         }
         is_unicode = 1;
     } else
         is_unicode = 0;
 
     cli_dbgmsg("ext names size: 0x%x\n", size);
 
     nbytes = size;
     while (nbytes > 0) {
         uint8_t length;
         off_t offset;
 
         if (cli_readn(fd, &length, 1) != 1) {
             cli_dbgmsg("read macro_extnames failed\n");
             return FALSE;
         }
 
         if (is_unicode)
             offset = (off_t)length * 2 + 1;
         else
             offset = (off_t)length;
 
         /* ignore numref as well */
         if (lseek(fd, offset + sizeof(uint16_t), SEEK_CUR) == -1) {
             cli_dbgmsg("read macro_extnames failed to seek\n");
             return FALSE;
         }
         nbytes -= size;
     }
     return TRUE;
7b9aed8c
 }
 
d9a9e1fc
 static int
9fe789f8
 word_skip_macro_intnames(int fd)
7b9aed8c
 {
288057e9
     uint16_t count;
 
     if (!read_uint16(fd, &count, FALSE)) {
         cli_dbgmsg("read macro_intnames failed\n");
         return FALSE;
     }
     cli_dbgmsg("intnames count: %u\n", (unsigned int)count);
 
     while (count-- > 0) {
         uint8_t length;
 
         /* id */
         if (!seekandread(fd, sizeof(uint16_t), SEEK_CUR, &length, sizeof(uint8_t))) {
             cli_dbgmsg("skip_macro_intnames failed\n");
             return FALSE;
         }
 
         /* Internal name, plus one byte of unknown data */
         if (lseek(fd, length + 1, SEEK_CUR) == -1) {
             cli_dbgmsg("skip_macro_intnames failed\n");
             return FALSE;
         }
     }
     return TRUE;
7b9aed8c
 }
 
faa0d267
 vba_project_t *
72ce4b70
 cli_wm_readdir(int fd)
7b9aed8c
 {
288057e9
     int done;
     off_t end_offset;
     unsigned char info_id;
     macro_info_t macro_info;
     vba_project_t *vba_project;
     mso_fib_t fib;
 
     if (!word_read_fib(fd, &fib))
         return NULL;
 
     if (fib.macro_len == 0) {
         cli_dbgmsg("wm_readdir: No macros detected\n");
         /* Must be clean */
         return NULL;
     }
     cli_dbgmsg("wm_readdir: macro offset: 0x%.4x\n", (int)fib.macro_offset);
     cli_dbgmsg("wm_readdir: macro len: 0x%.4x\n\n", (int)fib.macro_len);
 
     /* Go one past the start to ignore start_id */
     if (lseek(fd, fib.macro_offset + 1, SEEK_SET) != (off_t)(fib.macro_offset + 1)) {
         cli_dbgmsg("wm_readdir: lseek macro_offset failed\n");
         return NULL;
     }
 
     end_offset         = fib.macro_offset + fib.macro_len;
     done               = FALSE;
     macro_info.entries = NULL;
     macro_info.count   = 0;
 
     while ((lseek(fd, 0, SEEK_CUR) < end_offset) && !done) {
         if (cli_readn(fd, &info_id, 1) != 1) {
             cli_dbgmsg("wm_readdir: read macro_info failed\n");
             break;
         }
         switch (info_id) {
             case 0x01:
                 if (macro_info.count)
                     free(macro_info.entries);
                 word_read_macro_info(fd, &macro_info);
                 done = TRUE;
                 break;
             case 0x03:
                 if (!word_skip_oxo3(fd))
                     done = TRUE;
                 break;
             case 0x05:
                 if (!word_skip_menu_info(fd))
                     done = TRUE;
                 break;
             case 0x10:
                 if (!word_skip_macro_extnames(fd))
                     done = TRUE;
                 break;
             case 0x11:
                 if (!word_skip_macro_intnames(fd))
                     done = TRUE;
                 break;
             case 0x40: /* end marker */
             case 0x12: /* ??? */
                 done = TRUE;
                 break;
             default:
                 cli_dbgmsg("wm_readdir: unknown type: 0x%x\n", info_id);
                 done = TRUE;
         }
     }
 
     if (macro_info.count == 0)
         return NULL;
 
     vba_project = create_vba_project(macro_info.count, "", NULL);
 
     if (vba_project) {
         vba_project->length = (uint32_t *)cli_malloc(sizeof(uint32_t) *
                                                      macro_info.count);
         vba_project->key    = (unsigned char *)cli_malloc(sizeof(unsigned char) *
                                                        macro_info.count);
         if ((vba_project->length != NULL) &&
             (vba_project->key != NULL)) {
             int i;
             const macro_entry_t *m = macro_info.entries;
 
             for (i = 0; i < macro_info.count; i++) {
                 vba_project->offset[i] = m->offset;
                 vba_project->length[i] = m->len;
                 vba_project->key[i]    = m->key;
                 m++;
             }
         } else {
241e7eb1
             cli_errmsg("cli_wm_readdir: Unable to allocate memory for vba_project\n");
288057e9
             free(vba_project->name);
             free(vba_project->colls);
             free(vba_project->dir);
             free(vba_project->offset);
             if (vba_project->length)
                 free(vba_project->length);
             if (vba_project->key)
                 free(vba_project->key);
             free(vba_project);
             vba_project = NULL;
         }
     }
     free(macro_info.entries);
 
     return vba_project;
7b9aed8c
 }
 
9fe789f8
 unsigned char *
11d24f8a
 cli_wm_decrypt_macro(int fd, off_t offset, uint32_t len, unsigned char key)
7b9aed8c
 {
288057e9
     unsigned char *buff;
fa53d800
 
288057e9
     if (len == 0)
         return NULL;
faa0d267
 
288057e9
     if (fd < 0)
         return NULL;
2b459819
 
288057e9
     buff = (unsigned char *)cli_malloc(len);
     if (buff == NULL) {
241e7eb1
         cli_errmsg("cli_wm_decrypt_macro: Unable to allocate memory for buff\n");
288057e9
         return NULL;
     }
 
     if (!seekandread(fd, offset, SEEK_SET, buff, len)) {
         free(buff);
         return NULL;
241e7eb1
     }
288057e9
     if (key) {
         unsigned char *p;
7b9aed8c
 
288057e9
         for (p = buff; p < &buff[len]; p++)
             *p ^= key;
     }
     return buff;
7b9aed8c
 }
9fe789f8
 
 /*
  * Keep reading bytes until we reach a NUL. Returns 0 if none is found
  */
 static int
 skip_past_nul(int fd)
 {
f6f2869f
     char *end;
     char smallbuf[128];
 
     do {
6c03dc5d
         size_t nread = cli_readn(fd, smallbuf, sizeof(smallbuf));
         if ((nread == 0) || (nread == (size_t)-1))
288057e9
             return FALSE;
         end = memchr(smallbuf, '\0', nread);
         if (end) {
c943e22c
             if (lseek(fd, 1 + (end - smallbuf) - (off_t)nread, SEEK_CUR) < 0)
288057e9
                 return FALSE;
             return TRUE;
         }
f6f2869f
     } while (1);
9fe789f8
 }
 
 /*
  * Read 2 bytes as a 16-bit number, host byte order. Return success or fail
  */
 static int
16975455
 read_uint16(int fd, uint16_t *u, int big_endian)
9fe789f8
 {
288057e9
     if (cli_readn(fd, u, sizeof(uint16_t)) != sizeof(uint16_t))
         return FALSE;
9fe789f8
 
288057e9
     *u = vba_endian_convert_16(*u, big_endian);
9fe789f8
 
288057e9
     return TRUE;
9fe789f8
 }
 
 /*
  * Read 4 bytes as a 32-bit number, host byte order. Return success or fail
  */
 static int
16975455
 read_uint32(int fd, uint32_t *u, int big_endian)
9fe789f8
 {
288057e9
     if (cli_readn(fd, u, sizeof(uint32_t)) != sizeof(uint32_t))
         return FALSE;
9fe789f8
 
288057e9
     *u = vba_endian_convert_32(*u, big_endian);
9fe789f8
 
288057e9
     return TRUE;
9fe789f8
 }
 
 /*
  * Miss some bytes then read a bit
  */
 static int
 seekandread(int fd, off_t offset, int whence, void *data, size_t len)
 {
288057e9
     if (lseek(fd, offset, whence) == (off_t)-1) {
         cli_dbgmsg("lseek failed\n");
         return FALSE;
     }
6c03dc5d
     return cli_readn(fd, data, len) == len;
9fe789f8
 }
 
 /*
  * Create and initialise a vba_project structure
  */
 static vba_project_t *
72ce4b70
 create_vba_project(int record_count, const char *dir, struct uniq *U)
9fe789f8
 {
288057e9
     vba_project_t *ret;
9fe789f8
 
49df8ea7
     ret = (vba_project_t *)cli_calloc(1, sizeof(struct vba_project_tag));
9fe789f8
 
288057e9
     if (ret == NULL) {
241e7eb1
         cli_errmsg("create_vba_project: Unable to allocate memory for vba project structure\n");
288057e9
         return NULL;
241e7eb1
     }
9fe789f8
 
288057e9
     ret->name   = (char **)cli_malloc(sizeof(char *) * record_count);
     ret->colls  = (uint32_t *)cli_malloc(sizeof(uint32_t) * record_count);
     ret->dir    = cli_strdup(dir);
     ret->offset = (uint32_t *)cli_malloc(sizeof(uint32_t) * record_count);
 
49df8ea7
     if ((ret->colls == NULL) || (ret->name == NULL) || (ret->dir == NULL) || (ret->offset == NULL)) {
         cli_free_vba_project(ret);
241e7eb1
         cli_errmsg("create_vba_project: Unable to allocate memory for vba project elements\n");
288057e9
         return NULL;
     }
     ret->count = record_count;
     ret->U     = U;
9fe789f8
 
288057e9
     return ret;
9fe789f8
 }
49df8ea7
 
 /**
  * @brief Free up the memory associated with the vba_project_t type.
  *
  * @param project A vba_project_t type allocated by one of these:
  *  - create_vba_project()
  *  - cli_wm_readdir()
  *  - cli_vba_readdir()
  */
 void cli_free_vba_project(vba_project_t *vba_project)
 {
     if (vba_project) {
         if (vba_project->dir)
             free(vba_project->dir);
         if (vba_project->colls)
             free(vba_project->colls);
         if (vba_project->name)
             free(vba_project->name);
         if (vba_project->offset)
             free(vba_project->offset);
         if (vba_project->length)
             free(vba_project->length);
         if (vba_project->key)
             free(vba_project->key);
         free(vba_project);
     }
 
     return;
 }