libclamav/matcher-ac.c
8000d078
 /*
c442ca9c
  *  Copyright (C) 2013-2019 Cisco Systems, Inc. and/or its affiliates. All rights reserved.
  *  Copyright (C) 2007-2013 Sourcefire, Inc.
1a2906f4
  *
2023340a
  *  Authors: Tomasz Kojm
8000d078
  *
  *  This program is free software; you can redistribute it and/or modify
bb34cb31
  *  it under the terms of the GNU General Public License version 2 as
  *  published by the Free Software Foundation.
8000d078
  *
  *  This program is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  *
  *  You should have received a copy of the GNU General Public License
  *  along with this program; if not, write to the Free Software
48b7b4a7
  *  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
  *  MA 02110-1301, USA.
8000d078
  */
 
 #if HAVE_CONFIG_H
 #include "clamav-config.h"
 #endif
 
 #include <stdio.h>
 #include <string.h>
 #include <stdlib.h>
677fc4ba
 #include <ctype.h>
6bb841e8
 #include <sys/stat.h>
563582a1
 
 #include <assert.h>
9290ddf2
 #ifdef HAVE_UNISTD_H
8000d078
 #include <unistd.h>
b58fdfc2
 #endif
8000d078
 
 #include "clamav.h"
 #include "others.h"
b68d11d2
 #include "matcher.h"
8000d078
 #include "matcher-ac.h"
 #include "filetypes.h"
fbcef1b0
 #include "str.h"
b5513f8d
 #include "readdb.h"
589d8d8e
 #include "default.h"
02eabc6d
 #include "filtering.h"
8000d078
 
b94e66c4
 #include "mpool.h"
 
9290ddf2
 /*
  * Kinds of "special" pattern element, compared against cli_ac_special.type.
  *  - ALT_CHAR:      alternatives are single bytes kept in alt.byte (num of them).
  *  - ALT_STR_FIXED: num alternative strings kept in alt.f_str[].
  *  - ALT_STR:       alternatives kept as a linked list of cli_alt_node in alt.v_str.
  * NOTE(review): LINE_MARKER, BOUNDARY and WORD_MARKER are not referenced in
  * this part of the file; their handling is presumably further down.
  */
 #define AC_SPECIAL_ALT_CHAR             1
 #define AC_SPECIAL_ALT_STR_FIXED        2
 #define AC_SPECIAL_ALT_STR              3
 #define AC_SPECIAL_LINE_MARKER          4
 #define AC_SPECIAL_BOUNDARY             5
 #define AC_SPECIAL_WORD_MARKER          6
 
 /*
  * Single-bit flags (each value is a distinct power of two, so they can be
  * OR-ed together). For each of boundary / line marker / word marker there is
  * a LEFT and a RIGHT flag, each with a NEGATIVE variant.
  * NOTE(review): presumably stored in cli_ac_patt.boundary - confirm against
  * the code that sets and tests them.
  */
 #define AC_BOUNDARY_LEFT                0x0001
 #define AC_BOUNDARY_LEFT_NEGATIVE       0x0002
 #define AC_BOUNDARY_RIGHT               0x0004
 #define AC_BOUNDARY_RIGHT_NEGATIVE      0x0008
 #define AC_LINE_MARKER_LEFT             0x0010
 #define AC_LINE_MARKER_LEFT_NEGATIVE    0x0020
 #define AC_LINE_MARKER_RIGHT            0x0040
 #define AC_LINE_MARKER_RIGHT_NEGATIVE   0x0080
 #define AC_WORD_MARKER_LEFT             0x0100
 #define AC_WORD_MARKER_LEFT_NEGATIVE    0x0200
 #define AC_WORD_MARKER_RIGHT            0x0400
 #define AC_WORD_MARKER_RIGHT_NEGATIVE   0x0800
8c3c77b4
 
 /*
  * Per-byte classification table, indexed by byte value (0..255).
  * Only the entries listed here are non-zero; every other byte maps to 0.
  * The character shown next to each index is its ASCII reading.
  * NOTE(review): the meaning of the values 1, 2 and 3 is defined by the code
  * that consults this table, which is not in this part of the file.
  */
 static char boundary[256] = {
     [0x0a] = 2, /* '\n' */
     [0x0d] = 2, /* '\r' */
     [0x20] = 3, /* ' '  */
     [0x22] = 2, /* '"'  */
     [0x27] = 2, /* '\'' */
     [0x2d] = 3, /* '-'  */
     [0x2e] = 1, /* '.'  */
     [0x2f] = 3, /* '/'  */
     [0x3c] = 1, /* '<'  */
     [0x3d] = 2, /* '='  */
     [0x3e] = 2, /* '>'  */
     [0x40] = 1, /* '@'  */
     [0x5f] = 3  /* '_'  */
 };
 
3e265c46
 static inline int insert_list(struct cli_matcher *root, struct cli_ac_patt *pattern, struct cli_ac_node *pt)
8000d078
 {
3e265c46
     struct cli_ac_list *ph, *new, *ph_prev, *ph_add_after;
     struct cli_ac_list **newtable;
51ca644c
     struct cli_ac_patt *php;
e772c090
     struct cli_ac_special *a1, *a2;
59506ff5
     struct cli_alt_node *b1, *b2;
cc12e21d
     int match;
     uint16_t i, j;
e772c090
 
3e265c46
     new = (struct cli_ac_list *)mpool_calloc(root->mempool, 1, sizeof(struct cli_ac_list));
51ca644c
     if (!new) {
3e265c46
         cli_errmsg("cli_ac_addpatt: Can't allocate memory for list node\n");
e772c090
         return CL_EMEM;
fbcef1b0
     }
51ca644c
     new->me = pattern;
e38ab7c1
 
3e265c46
     root->ac_lists++;
     newtable = mpool_realloc(root->mempool, root->ac_listtable, root->ac_lists * sizeof(struct cli_ac_list *));
     if(!newtable) {
         root->ac_lists--;
         cli_errmsg("cli_ac_addpatt: Can't realloc ac_listtable\n");
         mpool_free(root->mempool, new);
         return CL_EMEM;
     }
 
     root->ac_listtable = newtable;
     root->ac_listtable[root->ac_lists - 1] = new;
 
e38ab7c1
     ph = pt->list;
b87fe385
     ph_add_after = ph_prev = NULL;
e38ab7c1
     while(ph) {
51ca644c
         php = ph->me;
         if(!ph_add_after && php->partno <= pattern->partno && (!ph->next || ph->next->me->partno > pattern->partno))
e772c090
             ph_add_after = ph;
f2102544
         if((php->length[0] == pattern->length[0]) && (php->prefix_length[0] == pattern->prefix_length[0]) && (php->ch[0] == pattern->ch[0]) && (php->ch[1] == pattern->ch[1]) && (php->boundary == pattern->boundary)) {
             if(!memcmp(php->pattern, pattern->pattern, php->length[0] * sizeof(uint16_t)) && !memcmp(php->prefix, pattern->prefix, php->prefix_length[0] * sizeof(uint16_t))) {
51ca644c
                 if(!php->special && !pattern->special) {
e772c090
                     match = 1;
51ca644c
                 } else if(php->special == pattern->special) {
e772c090
                     match = 1;
51ca644c
                     for(i = 0; i < php->special; i++) {
                         a1 = php->special_table[i];
e772c090
                         a2 = pattern->special_table[i];
 
                         if(a1->num != a2->num) {
                             match = 0;
                             break;
                         }
 
                         if(a1->negative != a2->negative) {
                             match = 0;
                             break;
                         }
 
                         if(a1->type != a2->type) {
                             match = 0;
                             break;
                         } else if(a1->type == AC_SPECIAL_ALT_CHAR) {
59506ff5
                             if(memcmp((a1->alt).byte, (a2->alt).byte, a1->num)) {
51ca644c
                                 match = 0;
                                 break;
e772c090
                             }
59506ff5
                         } else if(a1->type == AC_SPECIAL_ALT_STR_FIXED) {
9290ddf2
                             if(a1->len != a2->len) {
                                 match = 0;
                                 break;
                             }
 
                             for(j = 0; j < a1->num; j++) {
b7d0b832
                                 if(memcmp((a1->alt).f_str[j], (a2->alt).f_str[j], a1->len[0]))
9290ddf2
                                     break;
                             }
 
                             if(j < a1->num) {
                                 match = 0;
                                 break;
                             }
e772c090
                         } else if(a1->type == AC_SPECIAL_ALT_STR) {
9290ddf2
                             b1 = (a1->alt).v_str;
                             b2 = (a2->alt).v_str;
                             while(b1 && b2) {
                                 if((b1->len != b2->len) || memcmp(b1->str, b2->str, b1->len))
                                     break;
                                 b1 = b1->next;
                                 b2 = b2->next;
                             }
 
                             if(b1 || b2) {
                                 match = 0;
                                 break;
                             }
                         }
e772c090
                     }
                 } else {
                     match = 0;
                 }
 
                 if(match) {
51ca644c
                     if(pattern->partno < php->partno) {
                         new->next_same = ph;
e772c090
                         if(ph_prev)
                             ph_prev->next = ph->next;
                         else
                             pt->list = ph->next;
 
                         ph->next = NULL;
                         break;
                     } else {
51ca644c
                         while(ph->next_same && ph->next_same->me->partno < pattern->partno)
e772c090
                             ph = ph->next_same;
 
51ca644c
                         new->next_same = ph->next_same;
                         ph->next_same = new;
e772c090
                         return CL_SUCCESS;
                     }
                 }
             }
         }
 
         ph_prev = ph;
         ph = ph->next;
51ca644c
 
e38ab7c1
     }
 
b87fe385
     if(ph_add_after) {
51ca644c
         new->next = ph_add_after->next;
         ph_add_after->next = new;
b87fe385
     } else {
51ca644c
         new->next = pt->list;
         pt->list = new;
b87fe385
     }
8000d078
 
8d3aca30
     return CL_SUCCESS;
8000d078
 }
 
51ca644c
 /*
  * Allocate a zeroed trie node from root->mempool and append it to
  * root->ac_nodetable. The node gets a 256-entry transition table unless
  * `i` is the last index before `len` (i == len - 1).
  *
  * Returns the new node, or NULL if any allocation fails; in that case
  * everything allocated here is released and root->ac_nodes is unchanged.
  */
 static inline struct cli_ac_node *add_new_node(struct cli_matcher *root, uint16_t i, uint16_t len)
 {
     struct cli_ac_node **grown;
     struct cli_ac_node *node = (struct cli_ac_node *) mpool_calloc(root->mempool, 1, sizeof(struct cli_ac_node));

     if(node == NULL) {
         cli_errmsg("cli_ac_addpatt: Can't allocate memory for AC node\n");
         return NULL;
     }

     if(i + 1 != len) {
         node->trans = (struct cli_ac_node **) mpool_calloc(root->mempool, 256, sizeof(struct cli_ac_node *));
         if(node->trans == NULL) {
             cli_errmsg("cli_ac_addpatt: Can't allocate memory for new->trans\n");
             mpool_free(root->mempool, node);
             return NULL;
         }
     }

     /* grow the node table by one slot; roll the counter back on failure */
     root->ac_nodes++;
     grown = mpool_realloc(root->mempool, root->ac_nodetable, root->ac_nodes * sizeof(struct cli_ac_node *));
     if(grown != NULL) {
         root->ac_nodetable = grown;
         root->ac_nodetable[root->ac_nodes - 1] = node;
         return node;
     }

     root->ac_nodes--;
     cli_errmsg("cli_ac_addpatt: Can't realloc ac_nodetable\n");
     if(node->trans)
         mpool_free(root->mempool, node->trans);
     mpool_free(root->mempool, node);
     return NULL;
 }
 
 static int cli_ac_addpatt_recursive(struct cli_matcher *root, struct cli_ac_patt *pattern, struct cli_ac_node *pt, uint16_t i, uint16_t len)
 {
     struct cli_ac_node *next;
     int ret;
 
     /* last node, insert pattern here (base case)*/
     if(i >= len) {
3e265c46
         return insert_list(root, pattern, pt);
51ca644c
     }
 
     /* if current node has no trans table, generate one */
     if(!pt->trans) {
         pt->trans = (struct cli_ac_node **) mpool_calloc(root->mempool, 256, sizeof(struct cli_ac_node *));
         if(!pt->trans) {
             cli_errmsg("cli_ac_addpatt: Can't allocate memory for pt->trans\n");
             return CL_EMEM;
         }
     }
 
     /* if pattern is nocase, we need to enumerate all the combinations if applicable
      * it's why this function was re-written to be recursive
      */
dc70379a
     if((pattern->sigopts & ACPATT_OPTION_NOCASE) && isalpha(pattern->pattern[i] & 0xff)) {
51ca644c
         next = pt->trans[cli_nocasei((unsigned char) (pattern->pattern[i] & 0xff))];
         if(!next)
             next = add_new_node(root, i, len);
         if(!next)
             return CL_EMEM;
         else
             pt->trans[cli_nocasei((unsigned char) (pattern->pattern[i] & 0xff))] = next;
 
         if ((ret = cli_ac_addpatt_recursive(root, pattern, next, i+1, len)) != CL_SUCCESS)
             return ret;
     }
 
     /* normal transition, also enumerates the 'normal' nocase */
     next = pt->trans[(unsigned char) (pattern->pattern[i] & 0xff)];
     if(!next)
         next = add_new_node(root, i, len);
     if(!next)
         return CL_EMEM;
     else
         pt->trans[(unsigned char) (pattern->pattern[i] & 0xff)] = next;
 
     return cli_ac_addpatt_recursive(root, pattern, next, i+1, len);
 }
 
 int cli_ac_addpatt(struct cli_matcher *root, struct cli_ac_patt *pattern)
 {
     struct cli_ac_patt **newtable;
f2102544
     uint16_t len = MIN(root->ac_maxdepth, pattern->length[0]);
cc12e21d
     uint16_t i;
51ca644c
 
     for(i = 0; i < len; i++) {
         if(pattern->pattern[i] & CLI_MATCH_WILDCARD) {
             len = i;
             break;
         }
     }
 
     if(len < root->ac_mindepth) {
         /* cli_errmsg("cli_ac_addpatt: Signature for %s is too short\n", pattern->virname); */
         return CL_EMALFDB;
     }
 
     /* pattern added to master list */
     root->ac_patterns++;
     newtable = mpool_realloc(root->mempool, root->ac_pattable, root->ac_patterns * sizeof(struct cli_ac_patt *));
     if(!newtable) {
         root->ac_patterns--;
         cli_errmsg("cli_ac_addpatt: Can't realloc ac_pattable\n");
         return CL_EMEM;
     }
 
     root->ac_pattable = newtable;
     root->ac_pattable[root->ac_patterns - 1] = pattern;
 
     pattern->depth = len;
 
     return cli_ac_addpatt_recursive(root, pattern, root->ac_root, 0, len);
 }
 
fbcef1b0
 /*
  * One entry of the singly-linked FIFO queue managed by bfs_enqueue() and
  * bfs_dequeue(); ac_maketrans() uses it for its breadth-first trie walks.
  */
 struct bfs_list {
     struct cli_ac_node *node; /* queued trie node */
     struct bfs_list *next;    /* following queue entry, NULL for the tail */
 };
 
1a648b37
 static int bfs_enqueue(struct bfs_list **bfs, struct bfs_list **last, struct cli_ac_node *n)
8000d078
 {
e772c090
     struct bfs_list *new;
8000d078
 
fbcef1b0
     new = (struct bfs_list *) cli_malloc(sizeof(struct bfs_list));
     if(!new) {
e772c090
         cli_errmsg("bfs_enqueue: Can't allocate memory for bfs_list\n");
         return CL_EMEM;
8000d078
     }
e772c090
 
1a648b37
     new->next = NULL;
8000d078
     new->node = n;
1a648b37
 
     if(*last) {
e772c090
         (*last)->next = new;
         *last = new;
1a648b37
     } else {
e772c090
         *bfs = *last = new;
1a648b37
     }
fbcef1b0
 
8d3aca30
     return CL_SUCCESS;
8000d078
 }
 
a2f97877
 static struct cli_ac_node *bfs_dequeue(struct bfs_list **bfs, struct bfs_list **last)
8000d078
 {
e772c090
     struct bfs_list *lpt;
     struct cli_ac_node *pt;
8000d078
 
1a648b37
     if(!(lpt = *bfs)) {
e772c090
         return NULL;
8000d078
     } else {
e772c090
         *bfs = (*bfs)->next;
         pt = lpt->node;
 
         if(lpt == *last)
             *last = NULL;
 
         free(lpt);
         return pt;
8000d078
     }
 }
 
fbcef1b0
 static int ac_maketrans(struct cli_matcher *root)
8000d078
 {
e772c090
     struct bfs_list *bfs = NULL, *bfs_last = NULL;
     struct cli_ac_node *ac_root = root->ac_root, *child, *node, *fail;
     int i, ret;
8000d078
 
fbcef1b0
     for(i = 0; i < 256; i++) {
e772c090
         node = ac_root->trans[i];
         if(!node) {
             ac_root->trans[i] = ac_root;
         } else {
             node->fail = ac_root;
             if((ret = bfs_enqueue(&bfs, &bfs_last, node)))
                 return ret;
         }
8000d078
     }
 
a2f97877
     while((node = bfs_dequeue(&bfs, &bfs_last))) {
e772c090
         if(IS_LEAF(node)) {
             struct cli_ac_node *failtarget = node->fail;
 
             while (NULL != failtarget && (IS_LEAF(failtarget) || !IS_FINAL(failtarget)))
                 failtarget = failtarget->fail;
 
51c9a991
             if (NULL != failtarget)
                 node->fail = failtarget;
e772c090
 
             continue;
         }
 
         for(i = 0; i < 256; i++) {
             child = node->trans[i];
             if(child) {
                 fail = node->fail;
 
                 while(IS_LEAF(fail) || !fail->trans[i])
                     fail = fail->fail;
 
                 child->fail = fail->trans[i];
 
                 if((ret = bfs_enqueue(&bfs, &bfs_last, child)) != 0)
                     return ret;
             }
         }
8000d078
     }
fbcef1b0
 
a305a261
     bfs = bfs_last = NULL;
     for(i = 0; i < 256; i++) {
e772c090
         node = ac_root->trans[i];
         if(node != ac_root) {
             if((ret = bfs_enqueue(&bfs, &bfs_last, node)))
9290ddf2
                 return ret;
e772c090
         }
a305a261
     }
e772c090
 
a305a261
     while((node = bfs_dequeue(&bfs, &bfs_last))) {
e772c090
         if(IS_LEAF(node))
             continue;
         for(i = 0; i < 256; i++) {
             child = node->trans[i];
             if (!child || (!IS_FINAL(child) && IS_LEAF(child))) {
                 struct cli_ac_node *failtarget = node->fail;
 
                 while(IS_LEAF(failtarget) || !failtarget->trans[i])
                     failtarget = failtarget->fail;
 
                 failtarget = failtarget->trans[i];
                 node->trans[i] = failtarget;
             } else if (IS_FINAL(child) && IS_LEAF(child)) {
3e265c46
                 struct cli_ac_list *list;
e772c090
 
                 list = child->list;
                 if (list) {
                     while (list->next)
                         list = list->next;
 
                     list->next = child->fail->list;
                 } else {
                     child->list = child->fail->list;
                 }
 
                 child->trans = child->fail->trans;
             } else {
                 if((ret = bfs_enqueue(&bfs, &bfs_last, child)) != 0)
                     return ret;
             }
         }
a305a261
     }
 
8d3aca30
     return CL_SUCCESS;
8000d078
 }
 
5612732c
 int cli_ac_buildtrie(struct cli_matcher *root)
8000d078
 {
     if(!root)
e772c090
         return CL_EMALFDB;
8000d078
 
e772c090
     if(!(root->ac_root)) {
         cli_dbgmsg("cli_ac_buildtrie: AC pattern matcher is not initialised\n");
         return CL_SUCCESS;
8000d078
     }
 
380ae304
     if (root->filter)
e772c090
         cli_dbgmsg("Using filter for trie %d\n", root->type);
 
fbcef1b0
     return ac_maketrans(root);
8000d078
 }
 
23d7c6e6
 int cli_ac_init(struct cli_matcher *root, uint8_t mindepth, uint8_t maxdepth, uint8_t dconf_prefiltering)
8000d078
 {
563582a1
 #ifdef USE_MPOOL
     assert(root->mempool && "mempool must be initialized");
 #endif
8000d078
 
47d40feb
     root->ac_root = (struct cli_ac_node *) mpool_calloc(root->mempool, 1, sizeof(struct cli_ac_node));
fbcef1b0
     if(!root->ac_root) {
e772c090
         cli_errmsg("cli_ac_init: Can't allocate memory for ac_root\n");
         return CL_EMEM;
fbcef1b0
     }
8000d078
 
47d40feb
     root->ac_root->trans = (struct cli_ac_node **) mpool_calloc(root->mempool, 256, sizeof(struct cli_ac_node *));
fbcef1b0
     if(!root->ac_root->trans) {
e772c090
         cli_errmsg("cli_ac_init: Can't allocate memory for ac_root->trans\n");
         mpool_free(root->mempool, root->ac_root);
         return CL_EMEM;
8000d078
     }
fbcef1b0
 
     root->ac_mindepth = mindepth;
     root->ac_maxdepth = maxdepth;
 
5b74e89a
     if (cli_mtargets[root->type].enable_prefiltering && dconf_prefiltering) {
e772c090
         root->filter = mpool_malloc(root->mempool, sizeof(*root->filter));
         if (!root->filter) {
             cli_errmsg("cli_ac_init: Can't allocate memory for ac_root->filter\n");
             mpool_free(root->mempool, root->ac_root->trans);
             mpool_free(root->mempool, root->ac_root);
             return CL_EMEM;
         }
         filter_init(root->filter);
02eabc6d
     }
 
fbcef1b0
     return CL_SUCCESS;
8000d078
 }
 
b94e66c4
 #ifdef USE_MPOOL
a6d4c62e
 #define mpool_ac_free_special(a, b) ac_free_special(a, b)
 static void ac_free_special(mpool_t *mempool, struct cli_ac_patt *p)
b94e66c4
 #else
a6d4c62e
 #define mpool_ac_free_special(a, b) ac_free_special(b)
 static void ac_free_special(struct cli_ac_patt *p)
b94e66c4
 #endif
1a648b37
 {
59506ff5
     unsigned int i, j;
     struct cli_ac_special *a1;
     struct cli_alt_node *b1, *b2;
1a648b37
 
 
a6d4c62e
     if(!p->special)
e772c090
         return;
1a648b37
 
a6d4c62e
     for(i = 0; i < p->special; i++) {
e772c090
         a1 = p->special_table[i];
9290ddf2
         if (a1->type == AC_SPECIAL_ALT_CHAR) {
             mpool_free(mempool, (a1->alt).byte);
         } else if (a1->type == AC_SPECIAL_ALT_STR_FIXED) {
             for (j = 0; j < a1->num; j++)
                 mpool_free(mempool, (a1->alt).f_str[j]);
             mpool_free(mempool, (a1->alt).f_str);
         } else if (a1->type == AC_SPECIAL_ALT_STR) {
             b1 = (a1->alt).v_str;
             while (b1) {
                 b2 = b1->next;
                 mpool_free(mempool, b1->str);
                 mpool_free(mempool, b1);
                 b1 = b2;
             }
         }
         mpool_free(mempool, a1);
1a648b37
     }
a6d4c62e
     mpool_free(mempool, p->special_table);
1a648b37
 }
 
5612732c
 void cli_ac_free(struct cli_matcher *root)
8000d078
 {
e772c090
     uint32_t i;
     struct cli_ac_patt *patt;
8000d078
 
fbcef1b0
     for(i = 0; i < root->ac_patterns; i++) {
e772c090
         patt = root->ac_pattable[i];
         mpool_free(root->mempool, patt->prefix ? patt->prefix : patt->pattern);
         mpool_free(root->mempool, patt->virname);
         if(patt->special)
             mpool_ac_free_special(root->mempool, patt);
         mpool_free(root->mempool, patt);
fbcef1b0
     }
e772c090
 
fbcef1b0
     if(root->ac_pattable)
e772c090
         mpool_free(root->mempool, root->ac_pattable);
fbcef1b0
 
33872a43
     if(root->ac_reloff)
e772c090
         mpool_free(root->mempool, root->ac_reloff);
33872a43
 
74628936
     /* Freeing trans nodes must be done before freeing table nodes! */
8000d078
     for(i = 0; i < root->ac_nodes; i++) {
e772c090
         if(!IS_LEAF(root->ac_nodetable[i]) &&
            root->ac_nodetable[i]->fail &&
            root->ac_nodetable[i]->trans != root->ac_nodetable[i]->fail->trans) {
             mpool_free(root->mempool, root->ac_nodetable[i]->trans);
         }
74628936
     }
 
3e265c46
     for(i = 0; i < root->ac_lists; i++)
         mpool_free(root->mempool, root->ac_listtable[i]);
 
     if(root->ac_listtable)
         mpool_free(root->mempool, root->ac_listtable);
31ab943a
 
e772c090
     for(i = 0; i < root->ac_nodes; i++)
         mpool_free(root->mempool, root->ac_nodetable[i]);
8000d078
 
     if(root->ac_nodetable)
e772c090
         mpool_free(root->mempool, root->ac_nodetable);
 
fbcef1b0
     if(root->ac_root) {
e772c090
         mpool_free(root->mempool, root->ac_root->trans);
         mpool_free(root->mempool, root->ac_root);
fbcef1b0
     }
e772c090
 
02eabc6d
     if (root->filter)
e772c090
         mpool_free(root->mempool, root->filter);
8000d078
 }
 
677fc4ba
 /*
  * Parse and evaluate a logical-signature expression.
  *
  * The expression is the character range [expr, end). It is built from
  * unsigned subsignature ids, the binary operators '&' and '|', parentheses,
  * and count modifiers '=', '<', '>' followed by a number. A modifier that
  * follows a parenthesised block may take the form N,M.
  *
  * expr, end   start and one-past-the-end of the expression text
  * lsigcnt     per-subsignature match counts, indexed by id (read only when
  *             parse_only is 0)
  * cnt         incremented by the match counts of the satisfied part
  * ids         bit `id` is set for every subsignature that contributed
  * parse_only  non-zero: only validate the syntax
  *
  * Returns:
  *   parse_only != 0: the largest subsignature id found, or -1 on error.
  *   parse_only == 0: 1 if the expression is satisfied, 0 if not, -1 on a
  *                    syntax error or an id that does not fit in *ids.
  */
 int cli_ac_chklsig(const char *expr, const char *end, uint32_t *lsigcnt, unsigned int *cnt, uint64_t *ids, unsigned int parse_only)
 {
     unsigned int i, len = end - expr, pth = 0, opoff = 0, op1off = 0, val;
     unsigned int blkend = 0, id, modval1, modval2 = 0, lcnt = 0, rcnt = 0, tcnt, modoff = 0;
     uint64_t lids = 0, rids = 0, tids;
     int ret, lval, rval;
     char op = 0, op1 = 0, mod = 0, blkmod = 0;
     const char *lstart = expr, *lend = NULL, *rstart = NULL, *rend = end, *pt;

     /*
      * Scan for the operator to split on: `op` is the first '&'/'|' outside
      * any parentheses, `op1` the last one seen at nesting depth 1.
      */
     for(i = 0; i < len; i++) {
         switch(expr[i]) {
         case '(':
             pth++;
             break;

         case ')':
             if(!pth) {
                 cli_errmsg("cli_ac_chklsig: Syntax error: Missing opening parenthesis\n");
                 return -1;
             }
             pth--;
             /* fall through */
             /* NOTE(review): the original has no break here, so ')' is also
              * recorded as `mod`; kept as is - confirm that this is intended. */

         case '>':
         case '<':
         case '=':
             mod = expr[i];
             modoff = i;
             break;

         default:
             if(strchr("&|", expr[i])) {
                 if(!pth) {
                     op = expr[i];
                     opoff = i;
                 } else if(pth == 1) {
                     op1 = expr[i];
                     op1off = i;
                 }
             }
         }

         if(op)
             break;

         /* a depth-1 operator was seen and its block has just been closed */
         if(op1 && !pth) {
             blkend = i;
             if(expr[i + 1] == '>' || expr[i + 1] == '<' || expr[i + 1] == '=') {
                 blkmod = expr[i + 1];

                 ret = sscanf(&expr[i + 2], "%u,%u", &modval1, &modval2);
                 if(ret != 2)
                     ret = sscanf(&expr[i + 2], "%u", &modval1);

                 if(!ret || ret == EOF) {
                     cli_errmsg("chklexpr: Syntax error: Missing number after '%c'\n", expr[i + 1]);
                     return -1;
                 }

                 /* skip over the modifier's digits; isdigit() needs an unsigned char value */
                 for(i += 2; i + 1 < len && (isdigit((unsigned char) expr[i + 1]) || expr[i + 1] == ','); i++)
                     ;
             }

             /* the block modifier only applies when the block ends the expression */
             if(&expr[i + 1] == rend)
                 break;
             else
                 blkmod = 0;
         }
     }

     if(pth) {
         cli_errmsg("cli_ac_chklsig: Syntax error: Missing closing parenthesis\n");
         return -1;
     }

     /* no operator at all: a single (possibly parenthesised) subsignature id */
     if(!op && !op1) {
         if(expr[0] == '(')
             return cli_ac_chklsig(++expr, --end, lsigcnt, cnt, ids, parse_only);

         ret = sscanf(expr, "%u", &id);
         if(!ret || ret == EOF) {
             cli_errmsg("cli_ac_chklsig: Can't parse %s\n", expr);
             return -1;
         }

         if(parse_only) {
             val = id;
         } else {
             /* the id is used as a bit position in the 64-bit *ids mask below;
              * a larger value would make that shift undefined */
             if(id >= 8 * sizeof(*ids)) {
                 cli_errmsg("cli_ac_chklsig: Subsignature id %u is out of range\n", id);
                 return -1;
             }
             val = lsigcnt[id];
         }

         if(mod) {
             pt = expr + modoff + 1;
             ret = sscanf(pt, "%u", &modval1);
             if(!ret || ret == EOF) {
                 cli_errmsg("chklexpr: Syntax error: Missing number after '%c'\n", mod);
                 return -1;
             }

             if(!parse_only) {
                 switch(mod) {
                 case '=':
                     if(val != modval1)
                         return 0;
                     break;
                 case '<':
                     if(val >= modval1)
                         return 0;
                     break;
                 case '>':
                     if(val <= modval1)
                         return 0;
                     break;
                 default:
                     return 0;
                 }

                 *cnt += val;
                 *ids |= (uint64_t) 1 << id;
                 return 1;
             }
         }

         if(parse_only) {
             return val;
         } else {
             if(val) {
                 *cnt += val;
                 *ids |= (uint64_t) 1 << id;
                 return 1;
             } else {
                 return 0;
             }
         }
     }

     /* only a depth-1 operator: split inside the outer parentheses */
     if(!op) {
         op = op1;
         opoff = op1off;
         lstart++;
         rend = &expr[blkend];
     }

     if(!opoff) {
         cli_errmsg("cli_ac_chklsig: Syntax error: Missing left argument\n");
         return -1;
     }

     lend = &expr[opoff];
     if(opoff + 1 == len) {
         cli_errmsg("cli_ac_chklsig: Syntax error: Missing right argument\n");
         return -1;
     }

     rstart = &expr[opoff + 1];

     lval = cli_ac_chklsig(lstart, lend, lsigcnt, &lcnt, &lids, parse_only);
     if(lval == -1) {
         cli_errmsg("cli_ac_chklsig: Calculation of lval failed\n");
         return -1;
     }

     rval = cli_ac_chklsig(rstart, rend, lsigcnt, &rcnt, &rids, parse_only);
     if(rval == -1) {
         cli_errmsg("cli_ac_chklsig: Calculation of rval failed\n");
         return -1;
     }

     if(parse_only) {
         switch(op) {
         case '&':
         case '|':
             return MAX(lval, rval);
         default:
             cli_errmsg("cli_ac_chklsig: Incorrect operator type\n");
             return -1;
         }
     } else {
         switch(op) {
         case '&':
             ret = lval && rval;
             break;
         case '|':
             ret = lval || rval;
             break;
         default:
             cli_errmsg("cli_ac_chklsig: Incorrect operator type\n");
             return -1;
         }

         if(!blkmod) {
             if(ret) {
                 *cnt += lcnt + rcnt;
                 *ids |= lids | rids;
             }

             return ret;
         } else {
             if(ret) {
                 tcnt = lcnt + rcnt;
                 tids = lids | rids;
             } else {
                 tcnt = 0;
                 tids = 0;
             }

             /* block modifier: compare the block's total match count with modval1 */
             switch(blkmod) {
             case '=':
                 if(tcnt != modval1)
                     return 0;
                 break;
             case '<':
                 if(tcnt >= modval1)
                     return 0;
                 break;
             case '>':
                 if(tcnt <= modval1)
                     return 0;
                 break;
             default:
                 return 0;
             }

             /* optional second value: minimum number of distinct subsignatures matched */
             if(modval2) {
                 val = 0;
                 while(tids) {
                     val += tids & (uint64_t) 1;
                     tids >>= 1;
                 }

                 if(val < modval2)
                     return 0;
             }

             *cnt += tcnt;
             return 1;
         }
     }
 }
 
a2345bb5
 /*
  * Forward declarations of the matching helpers, so that they can be
  * referenced before their definitions.
  * NOTE(review): the definitions are not in this part of the file; they are
  * presumably further down - confirm the parameter order against them, since
  * (offset, bp) and (bp, offset) appear in different orders below.
  */
 inline static int ac_findmatch_special(const unsigned char *buffer, uint32_t offset, uint32_t bp, uint32_t fileoffset, uint32_t length,
                                        const struct cli_ac_patt *pattern, uint32_t pp, uint16_t specialcnt, uint32_t *start, uint32_t *end, int rev);
 static int ac_backward_match_branch(const unsigned char *buffer, uint32_t bp, uint32_t offset, uint32_t length, uint32_t fileoffset,
                                     const struct cli_ac_patt *pattern, uint32_t pp, uint16_t specialcnt, uint32_t *start, uint32_t *end);
 static int ac_forward_match_branch(const unsigned char *buffer, uint32_t bp, uint32_t offset, uint32_t length, uint32_t fileoffset,
                                    const struct cli_ac_patt *pattern, uint32_t pp, uint16_t specialcnt, uint32_t *start, uint32_t *end);
659a8077
 
dda6b057
 /*
  * Compare one pattern element `p` with one input byte `b`.
  * To be called only from ac_findmatch_special; does not handle recursive
  * specials.
  *
  * The macro expands to a switch statement and relies on two variables of the
  * calling scope: `wc` receives the metadata bits of `p`
  * ((p) & CLI_MATCH_METADATA) and `match` is set to 0 when the byte does not
  * match (it is left untouched otherwise). Both arguments are parenthesised
  * in the expansion but may be evaluated more than once, so they must not
  * have side effects.
  */
 #define AC_MATCH_CHAR2(p,b)                                                             \
     switch(wc = (p) & CLI_MATCH_METADATA) {                                             \
     case CLI_MATCH_CHAR:                                                                \
         if((unsigned char) (p) != (b))                                                  \
             match = 0;                                                                  \
         break;                                                                          \
                                                                                         \
     case CLI_MATCH_NOCASE:                                                              \
         if((unsigned char) ((p) & 0xff) != cli_nocase(b))                               \
             match = 0;                                                                  \
         break;                                                                          \
                                                                                         \
     case CLI_MATCH_IGNORE:                                                              \
         break;                                                                          \
                                                                                         \
     case CLI_MATCH_NIBBLE_HIGH:                                                         \
         if((unsigned char) ((p) & 0x00f0) != ((b) & 0xf0))                              \
             match = 0;                                                                  \
         break;                                                                          \
                                                                                         \
     case CLI_MATCH_NIBBLE_LOW:                                                          \
         if((unsigned char) ((p) & 0x000f) != ((b) & 0x0f))                              \
             match = 0;                                                                  \
         break;                                                                          \
                                                                                         \
     default:                                                                            \
         cli_errmsg("ac_findmatch: Unknown metatype 0x%x\n", wc);                        \
         match = 0;                                                                      \
     }
 
a2345bb5
 /*
  * AC_MATCH_CHAR(p, b, rev): compare one pattern element `p` against one
  * buffer byte `b`, resolving CLI_MATCH_SPECIAL elements through
  * ac_findmatch_special().
  *
  * call only by ac_XX_match_branch! The macro reads and writes variables of
  * the enclosing function: buffer, offset, bp, fileoffset, length, pattern,
  * i, specialcnt, start, end, wc and match.
  *
  *  - On a plain mismatch `match` is cleared.
  *  - On a special, a result <= 0 makes the ENCLOSING FUNCTION return that
  *    value immediately (0 = fail, < 0 = resolved in a nested branch).
  *    A result > 0 is the number of bytes consumed: `bp` is advanced
  *    (rev == 0) or moved back (rev != 0) by that amount minus the one step
  *    the caller's loop performs itself, and `specialcnt` is stepped in the
  *    same direction.
  *
  * `p` is evaluated more than once, so it must be free of side effects.
  */
 #define AC_MATCH_CHAR(p, b, rev)                                                            \
     do {                                                                                    \
         switch (wc = (p) & CLI_MATCH_METADATA) {                                            \
             case CLI_MATCH_CHAR:                                                            \
                 if ((unsigned char)(p) != (b))                                              \
                     match = 0;                                                              \
                 break;                                                                      \
                                                                                             \
             case CLI_MATCH_NOCASE:                                                          \
                 if ((unsigned char)((p) & 0xff) != cli_nocase(b))                           \
                     match = 0;                                                              \
                 break;                                                                      \
                                                                                             \
             case CLI_MATCH_IGNORE:                                                          \
                 break;                                                                      \
                                                                                             \
             case CLI_MATCH_SPECIAL:                                                         \
                 /* >0 = movement, 0 = fail, <0 = resolved in branch */                      \
                 if ((match = ac_findmatch_special(buffer, offset, bp, fileoffset, length,   \
                                                   pattern, i, specialcnt, start, end,       \
                                                   (rev))) <= 0)                             \
                     return match;                                                           \
                                                                                             \
                 if (!(rev)) {                                                               \
                     bp += (match - 1); /* -1 is for bp++ in parent loop */                  \
                     specialcnt++;                                                           \
                 } else {                                                                    \
                     bp = bp + 1 - match; /* +1 is for bp-- in parent loop */                \
                     specialcnt--;                                                           \
                 }                                                                           \
                                                                                             \
                 break;                                                                      \
                                                                                             \
             case CLI_MATCH_NIBBLE_HIGH:                                                     \
                 if ((unsigned char)((p) & 0x00f0) != ((b) & 0xf0))                          \
                     match = 0;                                                              \
                 break;                                                                      \
                                                                                             \
             case CLI_MATCH_NIBBLE_LOW:                                                      \
                 if ((unsigned char)((p) & 0x000f) != ((b) & 0x0f))                          \
                     match = 0;                                                              \
                 break;                                                                      \
                                                                                             \
             default:                                                                        \
                 cli_errmsg("ac_findmatch: Unknown metatype 0x%x\n", wc);                    \
                 match = 0;                                                                  \
         }                                                                                   \
     } while (0)
 
dda6b057
 
659a8077
 /*
  * Special handler: evaluates special element number `specialcnt` of
  * `pattern` (taken from pattern->special_table) against the buffer at
  * position `bp`.
  *
  * `rev` selects the direction. With rev == 0 multi-byte alternates are
  * compared against the bytes STARTING at bp; with rev != 0 they are compared
  * against the bytes ENDING at bp. `pp` is the index of this special inside
  * the pattern/prefix and is only used to continue matching in a nested
  * branch call. offset, fileoffset, start and end are passed through to that
  * nested call unchanged.
  *
  * Returns:
  *   > 0  number of buffer bytes consumed by the special,
  *     0  no match,
  *    -1  a non-unique generic alternate matched AND the remainder of the
  *        pattern was validated by the nested branch call.
  */
a2345bb5
 inline static int ac_findmatch_special(const unsigned char *buffer, uint32_t offset, uint32_t bp, uint32_t fileoffset, uint32_t length,
                                        const struct cli_ac_patt *pattern, uint32_t pp, uint16_t specialcnt, uint32_t *start, uint32_t *end, int rev)
659a8077
 {
59506ff5
     int match, cmp;
28a56447
     uint16_t j, b = buffer[bp];
dda6b057
     uint16_t wc;
a2345bb5
     uint32_t subbp;
659a8077
     struct cli_ac_special *special = pattern->special_table[specialcnt];
59506ff5
     struct cli_alt_node *alt = NULL;
659a8077
 
     /* default result: a negated special "matches" unless an alternative is found */
     match = special->negative;
 
     switch(special->type) {
59506ff5
     case AC_SPECIAL_ALT_CHAR: /* single-byte */
         for (j = 0; j < special->num; j++) {
bb50eef3
             /* the scan stops as soon as b is smaller than the current
              * alternative - presumably the byte list is sorted ascending;
              * verify against the code that builds special->alt */
             cmp = b - (special->alt).byte[j];
cdd018d5
             if (cmp == 0) {
9290ddf2
                 match = !special->negative;
                 break;
bb50eef3
             } else if (cmp < 0)
9290ddf2
                 break;
659a8077
         }
         break;
 
59506ff5
     case AC_SPECIAL_ALT_STR_FIXED: /* fixed length multi-byte */
a2345bb5
         /* locate the first byte of the candidate window; bail out (keeping
          * the default result) when the window would leave the buffer */
         if (!rev) {
             if (bp + special->len[0] > length)
                 break;
             subbp = bp;
         } else {
             if (bp < (special->len[0] - 1))
                 break;
             subbp = bp - (special->len[0] - 1);
         }
9290ddf2
 
b7d0b832
         /* scale the default so that a negated special which finds no
          * alternative reports len[0] consumed bytes */
         match *= special->len[0];
9290ddf2
         for (j = 0; j < special->num; j++) {
a2345bb5
             cmp = memcmp(&buffer[subbp], (special->alt).f_str[j], special->len[0]);
cdd018d5
             if (cmp == 0) {
b7d0b832
                 match = (!special->negative) * special->len[0];
9290ddf2
                 break;
bb50eef3
             } else if (cmp < 0)
cdd018d5
                 break;
9290ddf2
         }
2b512658
         break;
 
     case AC_SPECIAL_ALT_STR: /* generic */
9290ddf2
         /* walk the linked list of variable-length alternatives */
         alt = (special->alt).v_str;
         while (alt) {
a2345bb5
             /* skip alternatives that do not fit into the buffer in the
              * requested direction */
             if (!rev) {
                 if (bp + alt->len > length) {
                     alt = alt->next;
                     continue;
                 }
                 subbp = bp;
             } else {
                 if (bp < (alt->len - 1)) {
                     alt = alt->next;
                     continue;
                 }
                 subbp = bp - (alt->len - 1);
9290ddf2
             }
 
             /* note that generic alternates CANNOT be negated */
dda6b057
             match = 1;
             for (j = 0; j < alt->len; j++) {
a2345bb5
                 AC_MATCH_CHAR2(alt->str[j],buffer[subbp+j]);
dda6b057
                 if (!match)
                     break;
             }
             if (match) {
590d4023
                 /* if match is unique (has no derivatives), we can pass it directly back */
                 if (alt->unique) {
                     match = alt->len;
                     break;
                 }
4ffcf308
                 /* branch for backtracking */
a2345bb5
                 /* the nested call validates everything after (forward) or
                  * before (backward) this alternative; on failure the next
                  * alternative in the list is tried */
                 if (!rev)
                     match = ac_forward_match_branch(buffer, subbp+alt->len, offset, fileoffset, length, pattern, pp+1, specialcnt+1, start, end);
                 else
                     match = ac_backward_match_branch(buffer, subbp-1, offset, fileoffset, length, pattern, pp-1, specialcnt-1, start, end);
9290ddf2
                 if (match)
                     return -1; /* alerts caller that match has been resolved in child callee */
dda6b057
             }
9290ddf2
 
             alt = alt->next;
         }
         break;
659a8077
 
     case AC_SPECIAL_LINE_MARKER:
         /* "\n" consumes one byte, "\r\n" two */
         /* NOTE(review): the "\r\n" look-ahead reads bp + 1 and does not
          * consult rev - confirm this is intended for backward matching */
         if(b == '\n')
             match = !special->negative;
28a56447
         else if(b == '\r' && (bp + 1 < length && buffer[bp + 1] == '\n'))
2b512658
             match = (!special->negative) * 2;
659a8077
         break;
 
     case AC_SPECIAL_BOUNDARY:
         /* any non-zero entry of the boundary[] table counts */
         if(boundary[b])
             match = !special->negative;
         break;
 
     case AC_SPECIAL_WORD_MARKER:
         if(!isalnum(b))
             match = !special->negative;
         break;
 
     default:
         cli_errmsg("ac_findmatch: Unknown special\n");
         match = 0;
     }
 
     return match;
 }
 
 /* state should reset on call, recursion depth = number of alternate specials */
a2345bb5
 /* each loop iteration starts on the NEXT sequence to be validated */
 /*
  * Backward half of pattern validation.
  *
  * Steps, in order:
  *   1. if the pattern has a prefix, match prefix[pp..0] against the buffer
  *      walking backwards from bp; otherwise the match starts at `offset`;
  *   2. store the resulting buffer position in *start;
  *   3. evaluate the left-side boundary / line-marker / word-marker flags of
  *      pattern->boundary against the byte(s) just before the start;
  *   4. unless ch[0] is CLI_MATCH_IGNORE, search for ch[0] at a distance of
  *      ch_mindist[0]..ch_maxdist[0] bytes before the start.
  *
  * `specialcnt` is the index of the next special to be consumed while walking
  * backwards (AC_MATCH_CHAR decrements it). `end` and `length` are not used
  * directly here; they are only forwarded by AC_MATCH_CHAR.
  *
  * Returns 1 when every check passes and 0 on failure. Because AC_MATCH_CHAR
  * may return from this function, the result can also be the non-positive
  * value of ac_findmatch_special (0 = fail, -1 = resolved in a nested branch).
  */
 static int ac_backward_match_branch(const unsigned char *buffer, uint32_t bp, uint32_t offset, uint32_t fileoffset, uint32_t length,
                                     const struct cli_ac_patt *pattern, uint32_t pp, uint16_t specialcnt, uint32_t *start, uint32_t *end)
659a8077
 {
927b2bab
     int match = 0;
659a8077
     uint16_t wc, i;
a2345bb5
     uint32_t filestart;
2242da43
 
a2345bb5
     /* backwards (prefix) validation, determines start */
47bccd1b
     if(pattern->prefix && pattern->prefix_length[0]) {
a2345bb5
         match = 1;
e772c090
 
a2345bb5
         /* AC_MATCH_CHAR may move bp further back (multi-byte specials) or
          * return from this function */
         for (i = pp; 1; i--) {
             AC_MATCH_CHAR(pattern->prefix[i],buffer[bp],1);
             if(!match)
                 return 0;
 
             /* needs to perform check before decrement due to unsignedness */
             if (i == 0 || bp == 0)
                 break;
 
             bp--;
         }
 
         *start = bp;
         /* translate the buffer position of the start into a file offset */
         filestart = fileoffset - offset + bp;
     } else {
         /* bp is set to buffer offset */
         *start = bp = offset;
         filestart = fileoffset;
8000d078
     }
 
a2345bb5
     /* left-side special checks, bp = start */
     /* each check starts from the "negative" flag and inverts it when the
      * condition holds; a file offset of 0 always satisfies the condition */
8c3c77b4
     if(pattern->boundary & AC_BOUNDARY_LEFT) {
e772c090
         match = !!(pattern->boundary & AC_BOUNDARY_LEFT_NEGATIVE);
a2345bb5
         /* only boundary[] values 1 and 3 are accepted on the left side */
         if(!filestart || (bp && (boundary[buffer[bp - 1]] == 1 || boundary[buffer[bp - 1]] == 3)))
e772c090
             match = !match;
 
         if(!match)
             return 0;
8c3c77b4
     }
 
a2345bb5
     if(pattern->boundary & AC_LINE_MARKER_LEFT) {
         match = !!(pattern->boundary & AC_LINE_MARKER_LEFT_NEGATIVE);
         if(!filestart || (bp && (buffer[bp - 1] == '\n')))
e772c090
             match = !match;
 
         if(!match)
             return 0;
8c3c77b4
     }
 
a2345bb5
 
     if(pattern->boundary & AC_WORD_MARKER_LEFT) {
         match = !!(pattern->boundary & AC_WORD_MARKER_LEFT_NEGATIVE);
         if(!filestart)
             match = !match;
         else if(pattern->sigopts & ACPATT_OPTION_WIDE) {
             /* wide patterns look at the two bytes before the start */
             /* NOTE(review): the two ifs below are independent, so match is
              * inverted twice when filestart == 1 and bp > 1 - confirm */
             if(filestart-1 == 0)
                 match = !match;
             if(bp - 1 && bp && !(isalnum(buffer[bp - 2]) && buffer[bp - 1] == '\0'))
                 match = !match;
         }
         else if(bp && !isalnum(buffer[bp - 1]))
e772c090
             match = !match;
 
         if(!match)
             return 0;
723a44d5
     }
 
a2345bb5
     /* bp is shifted for left anchor check, thus invalidated as pattern start */
     if(!(pattern->ch[0] & CLI_MATCH_IGNORE)) {
         /* not enough bytes before the start to hold the minimum distance */
         if(pattern->ch_mindist[0] + (uint32_t) 1 > bp)
             return 0;
 
         bp -= pattern->ch_mindist[0] + 1;
         /* try every allowed distance, moving one byte further back each time */
         for(i = pattern->ch_mindist[0]; i <= pattern->ch_maxdist[0]; i++) {
             match = 1;
             AC_MATCH_CHAR(pattern->ch[0],buffer[bp],1);
             if(match)
                 break;
e772c090
 
a2345bb5
             if(!bp)
                 return 0;
             else
                 bp--;
         }
e772c090
         if(!match)
             return 0;
723a44d5
     }
 
a2345bb5
     return 1;
 }
 
 /* state should reset on call, recursion depth = number of alternate specials */
 /* each loop iteration starts on the NEXT sequence to validate */
 /*
  * Forward half of pattern validation.
  *
  * Steps, in order:
  *   1. match pattern[pp .. length[0]-1] against the buffer starting at bp
  *      (the loop also stops when bp reaches `length`);
  *   2. store the resulting buffer position in *end;
  *   3. evaluate the right-side boundary / line-marker / word-marker flags of
  *      pattern->boundary at that position;
  *   4. unless ch[1] is CLI_MATCH_IGNORE, search for ch[1] at a distance of
  *      ch_mindist[1]..ch_maxdist[1] bytes after the end;
  *   5. hand over to ac_backward_match_branch(), starting at buffer position
  *      offset-1 with the last prefix element and the special preceding
  *      pattern->special_pattern.
  *
  * `specialcnt` is the index of the next special to be consumed
  * (AC_MATCH_CHAR increments it).
  *
  * Returns the result of the backward branch on success and 0 on failure.
  * Because AC_MATCH_CHAR may return from this function, the result can also
  * be the non-positive value of ac_findmatch_special (0 = fail, -1 = resolved
  * in a nested branch).
  */
 static int ac_forward_match_branch(const unsigned char *buffer, uint32_t bp, uint32_t offset, uint32_t fileoffset, uint32_t length,
                                    const struct cli_ac_patt *pattern, uint32_t pp, uint16_t specialcnt, uint32_t *start, uint32_t *end)
 {
     int match;
     uint16_t wc, i;
 
     match = 1;
 
     /* forward (pattern) validation; determines end */
     /* AC_MATCH_CHAR may advance bp by more than one byte (multi-byte
      * specials) or return from this function */
     for(i = pp; i < pattern->length[0] && bp < length; i++) {
         AC_MATCH_CHAR(pattern->pattern[i],buffer[bp],0);
         if (!match)
             return 0;
 
         bp++;
     }
     *end = bp;
 
     /* right-side special checks, bp = end */
     /* each check starts from the "negative" flag and inverts it when the
      * condition holds; the conditions are only evaluated for buffers of at
      * most SCANBUFF bytes, where reaching `length` also satisfies them */
     if(pattern->boundary & AC_BOUNDARY_RIGHT) {
         match = !!(pattern->boundary & AC_BOUNDARY_RIGHT_NEGATIVE);
         /* boundary[] values >= 2 are accepted on the right side */
         if((length <= SCANBUFF) && (bp == length || boundary[buffer[bp]] >= 2))
f22d89ee
             match = !match;
a2345bb5
 
         if(!match)
             return 0;
     }
 
     if(pattern->boundary & AC_LINE_MARKER_RIGHT) {
         match = !!(pattern->boundary & AC_LINE_MARKER_RIGHT_NEGATIVE);
         if((length <= SCANBUFF) && (bp == length || buffer[bp] == '\n' || (buffer[bp] == '\r' && bp + 1 < length && buffer[bp + 1] == '\n')))
6b725bb7
             match = !match;
 
         if(!match)
             return 0;
     }
 
     if(pattern->boundary & AC_WORD_MARKER_RIGHT) {
         match = !!(pattern->boundary & AC_WORD_MARKER_RIGHT_NEGATIVE);
f22d89ee
         if(length <= SCANBUFF) {
             if(bp == length)
                 match = !match;
d2e77863
             /* wide patterns look at the two bytes following the end */
             else if((pattern->sigopts & ACPATT_OPTION_WIDE) && (bp+1 < length)) {
f22d89ee
                 if(!(isalnum(buffer[bp]) && buffer[bp + 1] == '\0'))
                     match = !match;
             }
d2e77863
             else if(!isalnum(buffer[bp]))
f22d89ee
                 match = !match;
         }
6b725bb7
 
         if(!match)
             return 0;
     }
 
a2345bb5
     /* bp is shifted for right anchor check, thus invalidated as pattern right-side */
1a2906f4
     if(!(pattern->ch[1] & CLI_MATCH_IGNORE)) {
e772c090
         bp += pattern->ch_mindist[1];
 
         /* try every allowed distance, moving one byte forward each time;
          * running off the buffer is a failure */
         for(i = pattern->ch_mindist[1]; i <= pattern->ch_maxdist[1]; i++) {
             if(bp >= length)
                 return 0;
 
             match = 1;
a2345bb5
             AC_MATCH_CHAR(pattern->ch[1],buffer[bp],0);
e772c090
             if(match)
                 break;
 
             bp++;
         }
 
         if(!match)
             return 0;
1a2906f4
     }
 
a2345bb5
     /* forward part accepted: validate the prefix and left-side conditions */
     return ac_backward_match_branch(buffer, offset-1, offset, fileoffset, length, pattern, pattern->prefix_length[0]-1, pattern->special_pattern-1, start, end);
8000d078
 }
 
a2345bb5
 inline static int ac_findmatch(const unsigned char *buffer, uint32_t offset, uint32_t fileoffset, uint32_t length, const struct cli_ac_patt *pattern, uint32_t *start, uint32_t *end)
659a8077
 {
     int match;
     uint16_t specialcnt = pattern->special_pattern;
 
a2345bb5
     /* minimal check as the maximum variable length may exceed the buffer */
600c04f0
     if((offset + pattern->length[1] > length) || (pattern->prefix_length[1] > offset))
659a8077
         return 0;
 
a2345bb5
     match = ac_forward_match_branch(buffer, offset+pattern->depth, offset, fileoffset, length, pattern, pattern->depth, specialcnt, start, end);
659a8077
     if(match)
9290ddf2
         return 1;
659a8077
     return 0;
 }
 
aca9ea82
 int cli_ac_initdata(struct cli_ac_data *data, uint32_t partsigs, uint32_t lsigs, uint32_t reloffsigs, uint8_t tracklen)
4e9ab8ed
 {
e772c090
     unsigned int i, j;
677fc4ba
 
cd94be7a
     UNUSEDPARAM(tracklen);
4e9ab8ed
 
     if(!data) {
e772c090
         cli_errmsg("cli_ac_init: data == NULL\n");
         return CL_ENULLARG;
4e9ab8ed
     }
c1206103
     memset((void *)data, 0, sizeof(struct cli_ac_data));
4e9ab8ed
 
aca9ea82
     data->reloffsigs = reloffsigs;
     if(reloffsigs) {
e772c090
         data->offset = (uint32_t *) cli_malloc(reloffsigs * 2 * sizeof(uint32_t));
         if(!data->offset) {
             cli_errmsg("cli_ac_init: Can't allocate memory for data->offset\n");
             return CL_EMEM;
         }
         for(i = 0; i < reloffsigs * 2; i += 2)
             data->offset[i] = CLI_OFF_NONE;
aca9ea82
     }
4e9ab8ed
 
aca9ea82
     data->partsigs = partsigs;
677fc4ba
     if(partsigs) {
d0cba11e
         data->offmatrix = (uint32_t ***) cli_calloc(partsigs, sizeof(uint32_t **));
e772c090
         if(!data->offmatrix) {
             cli_errmsg("cli_ac_init: Can't allocate memory for data->offmatrix\n");
 
             if(reloffsigs)
                 free(data->offset);
 
             return CL_EMEM;
         }
4e9ab8ed
     }
677fc4ba
  
     data->lsigs = lsigs;
     if(lsigs) {
e772c090
         data->lsigcnt = (uint32_t **) cli_malloc(lsigs * sizeof(uint32_t *));
         if(!data->lsigcnt) {
             if(partsigs)
                 free(data->offmatrix);
 
             if(reloffsigs)
                 free(data->offset);
 
             cli_errmsg("cli_ac_init: Can't allocate memory for data->lsigcnt\n");
             return CL_EMEM;
         }
         data->lsigcnt[0] = (uint32_t *) cli_calloc(lsigs * 64, sizeof(uint32_t));
         if(!data->lsigcnt[0]) {
             free(data->lsigcnt);
             if(partsigs)
                 free(data->offmatrix);
 
             if(reloffsigs)
                 free(data->offset);
 
             cli_errmsg("cli_ac_init: Can't allocate memory for data->lsigcnt[0]\n");
             return CL_EMEM;
         }
         for(i = 1; i < lsigs; i++)
             data->lsigcnt[i] = data->lsigcnt[0] + 64 * i;
7665e02d
         data->yr_matches = (uint8_t *) cli_calloc(lsigs, sizeof(uint8_t));
         if (data->yr_matches == NULL) {
             free(data->lsigcnt[0]);
             free(data->lsigcnt);
             if(partsigs)
                 free(data->offmatrix);
             
             if(reloffsigs)
                 free(data->offset);
             return CL_EMEM;
         }
e772c090
 
         /* subsig offsets */
7665e02d
         data->lsig_matches = (struct cli_lsig_matches **) cli_calloc(lsigs, sizeof(struct cli_lsig_matches *));
b7999b89
         if(!data->lsig_matches) {
7665e02d
             free(data->yr_matches);
b7999b89
             free(data->lsigcnt[0]);
             free(data->lsigcnt);
             if(partsigs)
                 free(data->offmatrix);
 
             if(reloffsigs)
                 free(data->offset);
 
             cli_errmsg("cli_ac_init: Can't allocate memory for data->lsig_matches\n");
             return CL_EMEM;
         }
e772c090
         data->lsigsuboff_last = (uint32_t **) cli_malloc(lsigs * sizeof(uint32_t *));
         data->lsigsuboff_first = (uint32_t **) cli_malloc(lsigs * sizeof(uint32_t *));
         if(!data->lsigsuboff_last || !data->lsigsuboff_first) {
b7999b89
             free(data->lsig_matches);
e772c090
             free(data->lsigsuboff_last);
             free(data->lsigsuboff_first);
7665e02d
             free(data->yr_matches);
e772c090
             free(data->lsigcnt[0]);
             free(data->lsigcnt);
             if(partsigs)
                 free(data->offmatrix);
 
             if(reloffsigs)
                 free(data->offset);
 
             cli_errmsg("cli_ac_init: Can't allocate memory for data->lsigsuboff_(last|first)\n");
             return CL_EMEM;
         }
         data->lsigsuboff_last[0] = (uint32_t *) cli_calloc(lsigs * 64, sizeof(uint32_t));
         data->lsigsuboff_first[0] = (uint32_t *) cli_calloc(lsigs * 64, sizeof(uint32_t));
         if(!data->lsigsuboff_last[0] || !data->lsigsuboff_first[0]) {
b7999b89
             free(data->lsig_matches);
e772c090
             free(data->lsigsuboff_last[0]);
             free(data->lsigsuboff_first[0]);
             free(data->lsigsuboff_last);
             free(data->lsigsuboff_first);
7665e02d
             free(data->yr_matches);
e772c090
             free(data->lsigcnt[0]);
             free(data->lsigcnt);
             if(partsigs)
                 free(data->offmatrix);
 
             if(reloffsigs)
                 free(data->offset);
 
             cli_errmsg("cli_ac_init: Can't allocate memory for data->lsigsuboff_(last|first)[0]\n");
             return CL_EMEM;
         }
         for(j = 0; j < 64; j++) {
             data->lsigsuboff_last[0][j] = CLI_OFF_NONE;
             data->lsigsuboff_first[0][j] = CLI_OFF_NONE;
         }
         for(i = 1; i < lsigs; i++) {
             data->lsigsuboff_last[i] = data->lsigsuboff_last[0] + 64 * i;
             data->lsigsuboff_first[i] = data->lsigsuboff_first[0] + 64 * i;
             for(j = 0; j < 64; j++) {
                 data->lsigsuboff_last[i][j] = CLI_OFF_NONE;
                 data->lsigsuboff_first[i][j] = CLI_OFF_NONE;
             }
         }
aca9ea82
     }
ab893605
     for (i=0;i<32;i++)
e772c090
         data->macro_lastmatch[i] = CLI_OFF_NONE;
aca9ea82
 
b87fe385
     data->min_partno = 1;
 
fbcef1b0
     return CL_SUCCESS;
 }
4e9ab8ed
 
294558a5
 int cli_ac_caloff(const struct cli_matcher *root, struct cli_ac_data *data, const struct cli_target_info *info)
33872a43
 {
e772c090
     int ret;
     unsigned int i;
     struct cli_ac_patt *patt;
33872a43
 
04ec2e19
     if(info)
e772c090
         data->vinfo = &info->exeinfo.vinfo;
d2ba6f98
 
33872a43
     for(i = 0; i < root->ac_reloff_num; i++) {
e772c090
         patt = root->ac_reloff[i];
         if(!info) {
             data->offset[patt->offset_min] = CLI_OFF_NONE;
         } else if((ret = cli_caloff(NULL, info, root->type, patt->offdata, &data->offset[patt->offset_min], &data->offset[patt->offset_max]))) {
             cli_errmsg("cli_ac_caloff: Can't calculate relative offset in signature for %s\n", patt->virname);
             return ret;
600c04f0
         } else if((data->offset[patt->offset_min] != CLI_OFF_NONE) && (data->offset[patt->offset_min] + patt->length[1] > info->fsize)) {
e772c090
             data->offset[patt->offset_min] = CLI_OFF_NONE;
         }
33872a43
     }
 
     return CL_SUCCESS;
 }
 
fbcef1b0
 void cli_ac_freedata(struct cli_ac_data *data)
 {
e772c090
     uint32_t i;
4e9ab8ed
 
b7999b89
     if (!data)
         return;
 
     if(data->partsigs) {
e772c090
         for(i = 0; i < data->partsigs; i++) {
             if(data->offmatrix[i]) {
                 free(data->offmatrix[i][0]);
                 free(data->offmatrix[i]);
             }
         }
         free(data->offmatrix);
         data->offmatrix = NULL;
         data->partsigs = 0;
677fc4ba
     }
 
b7999b89
     if(data->lsigs) {
         if (data->lsig_matches) {
             for (i = 0; i < data->lsigs; i++) {
                 struct cli_lsig_matches * ls_matches;
                 if ((ls_matches = data->lsig_matches[i])) {
                     uint32_t j;
                     for (j = 0; j < ls_matches->subsigs; j++) {
                         if (ls_matches->matches[j]) {
                             free(ls_matches->matches[j]);
                             ls_matches->matches[j] = 0;
                         }
                     }
                     free(data->lsig_matches[i]);
                     data->lsig_matches[i] = 0;
                 }
             }
             free(data->lsig_matches);
             data->lsig_matches = 0;
         }
7665e02d
         free(data->yr_matches);
e772c090
         free(data->lsigcnt[0]);
         free(data->lsigcnt);
         free(data->lsigsuboff_last[0]);
         free(data->lsigsuboff_last);
         free(data->lsigsuboff_first[0]);
         free(data->lsigsuboff_first);
         data->lsigs = 0;
227f8f7c
     }
aca9ea82
 
b7999b89
     if(data->reloffsigs) {
e772c090
         free(data->offset);
         data->reloffsigs = 0;
aca9ea82
     }
fbcef1b0
 }
227f8f7c
 
aec1e3be
 /* returns only CL_SUCCESS or CL_EMEM */
5025967e
 inline static int ac_addtype(struct cli_matched_type **list, cli_file_t type, off_t offset, const cli_ctx *ctx)
fbcef1b0
 {
e772c090
     struct cli_matched_type *tnode, *tnode_last;
4e9ab8ed
 
 
5025967e
     if(type == CL_TYPE_ZIPSFX) {
e772c090
         if(*list && ctx && ctx->engine->maxfiles && (*list)->cnt > ctx->engine->maxfiles)
             return CL_SUCCESS;
     } else if(*list && (*list)->cnt >= MAX_EMBEDDED_OBJ) {
         return CL_SUCCESS;
     }
4e9ab8ed
 
fbcef1b0
     if(!(tnode = cli_calloc(1, sizeof(struct cli_matched_type)))) {
e772c090
         cli_errmsg("cli_ac_addtype: Can't allocate memory for new type node\n");
         return CL_EMEM;
4e9ab8ed
     }
 
fbcef1b0
     tnode->type = type;
     tnode->offset = offset;
4e9ab8ed
 
fbcef1b0
     tnode_last = *list;
     while(tnode_last && tnode_last->next)
e772c090
         tnode_last = tnode_last->next;
4e9ab8ed
 
fbcef1b0
     if(tnode_last)
e772c090
         tnode_last->next = tnode;
fbcef1b0
     else
e772c090
         *list = tnode;
4e9ab8ed
 
fbcef1b0
     (*list)->cnt++;
4e9ab8ed
     return CL_SUCCESS;
 }
 
b7999b89
 int lsig_sub_matched(const struct cli_matcher *root, struct cli_ac_data *mdata, uint32_t lsigid1, uint32_t lsigid2, uint32_t realoff, int partial)
ab893605
 {
b7999b89
     const struct cli_ac_lsig *ac_lsig = root->ac_lsigtable[lsigid1];
     const struct cli_lsig_tdb *tdb = &ac_lsig->tdb;
70b3c2cc
 
     if(realoff != CLI_OFF_NONE) {
e772c090
         if(mdata->lsigsuboff_first[lsigid1][lsigid2] == CLI_OFF_NONE)
             mdata->lsigsuboff_first[lsigid1][lsigid2] = realoff;
 
         if(mdata->lsigsuboff_last[lsigid1][lsigid2] != CLI_OFF_NONE && ((!partial && realoff <= mdata->lsigsuboff_last[lsigid1][lsigid2]) || (partial && realoff < mdata->lsigsuboff_last[lsigid1][lsigid2])))
b7999b89
             return CL_SUCCESS;
e772c090
 
         mdata->lsigcnt[lsigid1][lsigid2]++;
         if(mdata->lsigcnt[lsigid1][lsigid2] <= 1 || !tdb->macro_ptids || !tdb->macro_ptids[lsigid2])
             mdata->lsigsuboff_last[lsigid1][lsigid2] = realoff;
70b3c2cc
     }
94f8946c
 
b7999b89
     if (ac_lsig->type & CLI_YARA_OFFSET && realoff != CLI_OFF_NONE) {
         struct cli_subsig_matches * ss_matches;
         struct cli_lsig_matches * ls_matches;
         cli_dbgmsg("lsig_sub_matched lsig %u:%u at %u\n", lsigid1, lsigid2, realoff);
 
         ls_matches = mdata->lsig_matches[lsigid1];
         if (ls_matches == NULL) { /* allocate cli_lsig_matches */
             ls_matches = mdata->lsig_matches[lsigid1] = (struct cli_lsig_matches *)cli_calloc(1, sizeof(struct cli_lsig_matches) +
                                                                                               (ac_lsig->tdb.subsigs - 1) * sizeof(struct cli_subsig_matches *));
             if (ls_matches == NULL) {
                 cli_errmsg("lsig_sub_matched: cli_calloc failed for cli_lsig_matches\n");
                 return CL_EMEM;
             }
             ls_matches->subsigs = ac_lsig->tdb.subsigs;
         }
         ss_matches = ls_matches->matches[lsigid2];
         if (ss_matches == NULL) { /*  allocate cli_subsig_matches */
             ss_matches = ls_matches->matches[lsigid2] = cli_malloc(sizeof(struct cli_subsig_matches));
             if (ss_matches == NULL) {
                 cli_errmsg("lsig_sub_matched: cli_malloc failed for cli_subsig_matches struct\n");
                 return CL_EMEM;
             }
             ss_matches->next = 0;
             ss_matches->last = sizeof(ss_matches->offsets) / sizeof(uint32_t) - 1; 
         }
         if (ss_matches->next > ss_matches->last) {  /* cli_matches out of space? realloc */
             ss_matches = ls_matches->matches[lsigid2] = cli_realloc(ss_matches, sizeof(struct cli_subsig_matches) + sizeof(uint32_t) * ss_matches->last * 2);
             if (ss_matches == NULL) {
                 cli_errmsg("lsig_sub_matched: cli_realloc failed for cli_subsig_matches struct\n");
                 return CL_EMEM;
             }
             ss_matches->last = sizeof(ss_matches->offsets)/ sizeof(uint32_t) + ss_matches->last * 2 - 1;
         }
         
         ss_matches->offsets[ss_matches->next] = realoff; /* finally, store the offset */
         ss_matches->next++;
     }
 
70b3c2cc
     if (mdata->lsigcnt[lsigid1][lsigid2] > 1) {
e772c090
         /* Check that the previous match had a macro match following it at the 
          * correct distance. This check is only done after the 1st match.*/
         const struct cli_ac_patt *macropt;
         uint32_t id, last_macro_match, smin, smax, last_macroprev_match;
 
         if (!tdb->macro_ptids)
b7999b89
             return CL_SUCCESS;
e772c090
 
         id = tdb->macro_ptids[lsigid2];
         if (!id)
b7999b89
             return CL_SUCCESS;
e772c090
 
         macropt = root->ac_pattable[id];
         smin = macropt->ch_mindist[0];
         smax = macropt->ch_maxdist[0];
         /* start of last macro match */
         last_macro_match = mdata->macro_lastmatch[macropt->sigid];
         /* start of previous lsig subsig match */
         last_macroprev_match = mdata->lsigsuboff_last[lsigid1][lsigid2];
         if (last_macro_match != CLI_OFF_NONE)
             cli_dbgmsg("Checking macro match: %u + (%u - %u) == %u\n",
9290ddf2
                        last_macroprev_match, smin, smax, last_macro_match);
e772c090
 
         if (last_macro_match == CLI_OFF_NONE ||
             last_macroprev_match + smin > last_macro_match ||
             last_macroprev_match + smax < last_macro_match) {
             cli_dbgmsg("Canceled false lsig macro match\n");
             /* Previous match was false - cancel it */
             mdata->lsigcnt[lsigid1][lsigid2]--;
             mdata->lsigsuboff_last[lsigid1][lsigid2] = realoff;
         } else {
             /* mark the macro sig itself matched */
             mdata->lsigcnt[lsigid1][lsigid2+1]++;
             mdata->lsigsuboff_last[lsigid1][lsigid2+1] = last_macro_match;
         }
ab893605
     }
b7999b89
     return CL_SUCCESS;
ab893605
 }
 
b7999b89
 int cli_ac_chkmacro(struct cli_matcher *root, struct cli_ac_data *data, unsigned lsigid1)
ab893605
 {
     const struct cli_lsig_tdb *tdb = &root->ac_lsigtable[lsigid1]->tdb;
     unsigned i;
b7999b89
     int rc;
 
ab893605
     /* Loop through all subsigs, and if they are tied to macros check that the
      * macro matched at a correct distance */
     for (i=0;i<tdb->subsigs;i++) {
b7999b89
         rc = lsig_sub_matched(root, data, lsigid1, i, CLI_OFF_NONE, 0);
         if (rc != CL_SUCCESS)
             return rc;
ab893605
     }
b7999b89
     return CL_SUCCESS;
ab893605
 }
 
 
d0cba11e
 /*
  * Runs the Aho-Corasick automaton rooted at root->ac_root over `buffer`.
  *
  * buffer, length - bytes to scan
  * virname        - if non-NULL, receives pt->virname of a matching signature
  * customdata     - if non-NULL, receives pt->customdata of a matching signature
  * res            - if non-NULL, every signature match is prepended to *res as a
  *                  malloc()ed cli_ac_result node and scanning continues instead
  *                  of returning CL_VIRUS
  * root           - matcher providing the trie and signature tables
  * mdata          - per-scan state (min_partno, offmatrix, offset, vinfo,
  *                  macro_lastmatch are read and/or written here)
  * offset         - added to buffer positions to form the offsets that are
  *                  checked and recorded (realoff, exptoff)
  * ftype          - compared against pt->rtype for file-type signatures
  * ftoffset       - if non-NULL, list handed to ac_addtype() for matching
  *                  file-type signatures
  * mode           - AC_SCAN_FT and/or AC_SCAN_VIR select which patterns are
  *                  considered
  * ctx            - used for cli_append_virus() when SCAN_ALLMATCHES holds
  *
  * Returns CL_CLEAN when root has no trie, CL_ENULLARG when mdata is required
  * but NULL, CL_EMEM on allocation/ac_addtype failure, CL_TYPE_IGNORED for a
  * matching CL_TYPE_IGNORED signature, any non-CL_SUCCESS code from
  * lsig_sub_matched(), CL_VIRUS on a signature match; otherwise the detected
  * type when AC_SCAN_FT is set in mode, else CL_CLEAN.
  */
 int cli_ac_scanbuff(
     const unsigned char *buffer,
     uint32_t length,
     const char **virname,
     void **customdata,
     struct cli_ac_result **res,
     const struct cli_matcher *root,
     struct cli_ac_data *mdata,
     uint32_t offset,
     cli_file_t ftype,
     struct cli_matched_type **ftoffset,
     unsigned int mode,
     cli_ctx *ctx)
 {
     struct cli_ac_node *current;
     struct cli_ac_list *pattN, *ptN;
     struct cli_ac_patt *patt, *pt;
     uint32_t i, bp, exptoff[2], realoff, matchstart, matchend;
     uint16_t j;
     uint8_t found, viruses_found = 0;
     uint32_t **offmatrix, swp;
     int type = CL_CLEAN;
     struct cli_ac_result *newres;
     int rc;

     if(!root->ac_root)
         return CL_CLEAN;

     if(!mdata && (root->ac_partsigs || root->ac_lsigs || root->ac_reloff_num)) {
         cli_errmsg("cli_ac_scanbuff: mdata == NULL\n");
         return CL_ENULLARG;
     }
     /* NOTE(review): the guard above still permits mdata == NULL when root has
      * no partsigs/lsigs/reloff entries, yet mdata->min_partno is read below for
      * every candidate pattern - confirm callers always pass a valid mdata. */

     current = root->ac_root;

     for(i = 0; i < length; i++)  {
         /* follow the transition for the next input byte */
         current = current->trans[buffer[i]];

         if(UNLIKELY(IS_FINAL(current))) {
             /* the fail node's list is visited at most once per final node:
              * it is swapped in (and cleared) the first time a pattern with
              * partno > min_partno is encountered */
             struct cli_ac_list *faillist = current->fail->list;
             pattN = current->list;
             while(pattN) {
                 patt = pattN->me;
                 if(patt->partno > mdata->min_partno) {
                     pattN = faillist;
                     faillist = NULL;
                     continue;
                 }
                 /* buffer index where the `depth` bytes ending at i begin */
                 bp = i + 1 - patt->depth;
                 /* cheap offset pre-filter, only applied when this list entry
                  * has no next_same chain */
                 if(patt->offdata[0] != CLI_OFF_VERSION && patt->offdata[0] != CLI_OFF_MACRO && !pattN->next_same && (patt->offset_min != CLI_OFF_ANY) && (!patt->sigid || patt->partno == 1)) {
                     if(patt->offset_min == CLI_OFF_NONE) {
                         pattN = pattN->next;
                         continue;
                     }
                     exptoff[0] = offset + bp - patt->prefix_length[2]; /* lower offset end */
                     exptoff[1] = offset + bp - patt->prefix_length[1]; /* higher offset end */
                     if(patt->offdata[0] == CLI_OFF_ABSOLUTE) {
                         if(patt->offset_max < exptoff[0] || patt->offset_min > exptoff[1]) {
                             pattN = pattN->next;
                             continue;
                         }
                     } else {
                         /* non-absolute: offset_min/offset_max index mdata->offset[] */
                         if(mdata->offset[patt->offset_min] == CLI_OFF_NONE || mdata->offset[patt->offset_max] < exptoff[0] || mdata->offset[patt->offset_min] > exptoff[1]) {
                             pattN = pattN->next;
                             continue;
                         }
                     }
                 }

                 ptN = pattN;
                 /* full verification; on success matchstart/matchend are set */
                 if(ac_findmatch(buffer, bp, offset + bp, length, patt, &matchstart, &matchend)) {
                     /* walk every entry chained through next_same */
                     while(ptN) {
                         pt = ptN->me;
                         if(pt->partno > mdata->min_partno)
                             break;

                         /* skip entries whose kind is not requested by `mode` */
                         if((pt->type && !(mode & AC_SCAN_FT)) || (!pt->type && !(mode & AC_SCAN_VIR))) {
                             ptN = ptN->next_same;
                             continue;
                         }

                         realoff = offset + matchstart;
                         if(pt->offdata[0] == CLI_OFF_VERSION) {
                             if(!cli_hashset_contains_maybe_noalloc(mdata->vinfo, realoff)) {
                                 ptN = ptN->next_same;
                                 continue;
                             }
                             cli_dbgmsg("cli_ac_scanbuff: VI match for offset %x\n", realoff);
                         } else if(pt->offdata[0] == CLI_OFF_MACRO) {
                             /* macro patterns only record where they last matched */
                             mdata->macro_lastmatch[patt->offdata[1]] = realoff;
                             ptN = ptN->next_same;
                             continue;
                         } else if(pt->offset_min != CLI_OFF_ANY && (!pt->sigid || pt->partno == 1)) {
                             if(pt->offset_min == CLI_OFF_NONE) {
                                 ptN = ptN->next_same;
                                 continue;
                             }
                             if(pt->offdata[0] == CLI_OFF_ABSOLUTE) {
                                 if(pt->offset_max < realoff || pt->offset_min > realoff) {
                                     ptN = ptN->next_same;
                                     continue;
                                 }
                             } else {
                                 if(mdata->offset[pt->offset_min] == CLI_OFF_NONE || mdata->offset[pt->offset_max] < realoff || mdata->offset[pt->offset_min] > realoff) {
                                     ptN = ptN->next_same;
                                     continue;
                                 }
                             }
                         }

                         if(pt->sigid) { /* it's a partial signature */

                             /* if 2nd or later part, confirm some prior part has matched */
                             if(pt->partno != 1 && (!mdata->offmatrix[pt->sigid - 1] || !mdata->offmatrix[pt->sigid - 1][pt->partno - 2][0])) {
                                 ptN = ptN->next_same;
                                 continue;
                             }

                             if(pt->partno + 1 > mdata->min_partno)
                                 mdata->min_partno = pt->partno + 1;

                             /* sparsely populated matrix, so allocate and initialize if NULL */
                             if(!mdata->offmatrix[pt->sigid - 1]) {
                                 /* one row pointer per part */
                                 mdata->offmatrix[pt->sigid - 1] = cli_malloc(pt->parts * sizeof(uint32_t *));
                                 if(!mdata->offmatrix[pt->sigid - 1]) {
                                     cli_errmsg("cli_ac_scanbuff: Can't allocate memory for mdata->offmatrix[%u]\n", pt->sigid - 1);
                                     return CL_EMEM;
                                 }

                                 /* single backing block; each row has CLI_DEFAULT_AC_TRACKLEN + 2 slots */
                                 mdata->offmatrix[pt->sigid - 1][0] = cli_malloc(pt->parts * (CLI_DEFAULT_AC_TRACKLEN + 2) * sizeof(uint32_t));
                                 if(!mdata->offmatrix[pt->sigid - 1][0]) {
                                     cli_errmsg("cli_ac_scanbuff: Can't allocate memory for mdata->offmatrix[%u][0]\n", pt->sigid - 1);
                                     free(mdata->offmatrix[pt->sigid - 1]);
                                     mdata->offmatrix[pt->sigid - 1] = NULL;
                                     return CL_EMEM;
                                 }
                                 /* fill every byte with 0xff so each slot reads as (uint32_t)-1 (empty) */
                                 memset(mdata->offmatrix[pt->sigid - 1][0], 0xff, pt->parts * (CLI_DEFAULT_AC_TRACKLEN + 2) * sizeof(uint32_t));
                                 /* slot 0 of each row is that row's write cursor */
                                 mdata->offmatrix[pt->sigid - 1][0][0] = 0;
                                 for(j = 1; j < pt->parts; j++) {
                                     mdata->offmatrix[pt->sigid - 1][j] = mdata->offmatrix[pt->sigid - 1][0] + j * (CLI_DEFAULT_AC_TRACKLEN + 2);
                                     mdata->offmatrix[pt->sigid - 1][j][0] = 0;
                                 }
                             }
                             offmatrix = mdata->offmatrix[pt->sigid - 1];

                             /* look for a recorded offset of the previous part that
                              * satisfies the mindist/maxdist constraints */
                             found = 0;
                             if(pt->partno != 1) {
                                 for(j = 1; (j <= CLI_DEFAULT_AC_TRACKLEN + 1) && (offmatrix[pt->partno - 2][j] != (uint32_t)-1); j++) {
                                     found = j;
                                     if(realoff < offmatrix[pt->partno - 2][j])
                                         found = 0;

                                     if(found && pt->maxdist)
                                         if(realoff - offmatrix[pt->partno - 2][j] > pt->maxdist)
                                             found = 0;

                                     if(found && pt->mindist)
                                         if(realoff - offmatrix[pt->partno - 2][j] < pt->mindist)
                                             found = 0;

                                     if(found)
                                         break;
                                 }
                             }

                             /* move the slot that satisfied part 2 to the front of row 0
                              * (and of the last row, except for CL_TYPE_MSEXE) */
                             if(pt->partno == 2 && found > 1) {
                                 swp = offmatrix[0][1];
                                 offmatrix[0][1] = offmatrix[0][found];
                                 offmatrix[0][found] = swp;

                                 if(pt->type != CL_TYPE_MSEXE) {
                                     swp = offmatrix[pt->parts - 1][1];
                                     offmatrix[pt->parts - 1][1] = offmatrix[pt->parts - 1][found];
                                     offmatrix[pt->parts - 1][found] = swp;
                                 }
                             }

                             if(pt->partno == 1 || (found && (pt->partno != pt->parts))) {
                                 if(offmatrix[pt->partno - 1][0] == CLI_DEFAULT_AC_TRACKLEN + 1)
                                     offmatrix[pt->partno - 1][0] = 1; /* wrap, ends up at 2 */
                                 offmatrix[pt->partno - 1][0]++;
                                 offmatrix[pt->partno - 1][offmatrix[pt->partno - 1][0]] = offset + matchend;

                                 if(pt->partno == 1) /* save realoff for the first part */
                                     offmatrix[pt->parts - 1][offmatrix[pt->partno - 1][0]] = realoff;
                             } else if(found && pt->partno == pt->parts) {
                                 /* last part matched: the whole partial signature matched */
                                 if(pt->type) {

                                     if(pt->type == CL_TYPE_IGNORED && (!pt->rtype || ftype == pt->rtype))
                                         return CL_TYPE_IGNORED;

                                     if((pt->type > type || pt->type >= CL_TYPE_SFX || pt->type == CL_TYPE_MSEXE) && (!pt->rtype || ftype == pt->rtype)) {
                                         cli_dbgmsg("Matched signature for file type %s\n", pt->virname);
                                         type = pt->type;
                                         if(ftoffset && (!*ftoffset || (*ftoffset)->cnt < MAX_EMBEDDED_OBJ || type == CL_TYPE_ZIPSFX) && (type >= CL_TYPE_SFX || ((ftype == CL_TYPE_MSEXE || ftype == CL_TYPE_ZIP || ftype == CL_TYPE_MSOLE2) && type == CL_TYPE_MSEXE)))  {
                                             /* FIXME: the first offset in the array is most likely the correct one but
                                              * it may happen it is not
                                              */
                                             for(j = 1; j <= CLI_DEFAULT_AC_TRACKLEN + 1 && offmatrix[0][j] != (uint32_t)-1; j++)
                                                 if(ac_addtype(ftoffset, type, offmatrix[pt->parts - 1][j], ctx))
                                                     return CL_EMEM;
                                         }

                                         /* reset the whole matrix for this signature */
                                         memset(offmatrix[0], 0xff, pt->parts * (CLI_DEFAULT_AC_TRACKLEN + 2) * sizeof(uint32_t));
                                         for(j = 0; j < pt->parts; j++)
                                             offmatrix[j][0] = 0;
                                     }

                                 } else { /* !pt->type */
                                     if(pt->lsigid[0]) {
                                         rc = lsig_sub_matched(root, mdata, pt->lsigid[1], pt->lsigid[2], offmatrix[pt->parts - 1][1], 1);
                                         if (rc != CL_SUCCESS)
                                             return rc;
                                         ptN = ptN->next_same;
                                         continue;
                                     }

                                     if(res) {
                                         /* collect the match in the caller's result list */
                                         newres = malloc(sizeof(*newres));
                                         if(!newres) {
                                             cli_errmsg("cli_ac_scanbuff: Can't allocate memory for newres %lu\n", (unsigned long)sizeof(struct cli_ac_result));
                                             return CL_EMEM;
                                         }
                                         newres->virname = pt->virname;
                                         newres->customdata = pt->customdata;
                                         newres->next = *res;
                                         newres->offset = (off_t)offmatrix[pt->parts - 1][1];
                                         *res = newres;

                                         ptN = ptN->next_same;
                                         continue;
                                     } else {
                                         if(ctx && SCAN_ALLMATCHES) {
                                             cli_append_virus(ctx, (const char *)pt->virname);
                                             viruses_found = 1;
                                         }
                                         if (virname)
                                             *virname = pt->virname;
                                         if(customdata)
                                             *customdata = pt->customdata;
                                         if (!ctx || !SCAN_ALLMATCHES)
                                             return CL_VIRUS;
                                         ptN = ptN->next_same;
                                         continue;
                                     }
                                 }
                             }

                         } else { /* old type signature */
                             if(pt->type) {
                                 if(pt->type == CL_TYPE_IGNORED && (!pt->rtype || ftype == pt->rtype))
                                     return CL_TYPE_IGNORED;

                                 if((pt->type > type || pt->type >= CL_TYPE_SFX || pt->type == CL_TYPE_MSEXE) && (!pt->rtype || ftype == pt->rtype)) {

                                     cli_dbgmsg("Matched signature for file type %s at %u\n", pt->virname, realoff);
                                     type = pt->type;
                                     if(ftoffset && (!*ftoffset || (*ftoffset)->cnt < MAX_EMBEDDED_OBJ || type == CL_TYPE_ZIPSFX) && (type == CL_TYPE_MBR || type >= CL_TYPE_SFX || ((ftype == CL_TYPE_MSEXE || ftype == CL_TYPE_ZIP || ftype == CL_TYPE_MSOLE2) && type == CL_TYPE_MSEXE)))  {

                                         if(ac_addtype(ftoffset, type, realoff, ctx))
                                             return CL_EMEM;
                                     }
                                 }
                             } else {
                                 if(pt->lsigid[0]) {
                                     rc = lsig_sub_matched(root, mdata, pt->lsigid[1], pt->lsigid[2], realoff, 0);
                                     if (rc != CL_SUCCESS)
                                         return rc;
                                     ptN = ptN->next_same;
                                     continue;
                                 }

                                 if(res) {
                                     /* collect the match in the caller's result list */
                                     newres = malloc(sizeof(*newres));
                                     if(!newres) {
                                         cli_errmsg("cli_ac_scanbuff: Can't allocate memory for newres %lu\n", (unsigned long)sizeof(struct cli_ac_result));
                                         return CL_EMEM;
                                     }
                                     newres->virname = pt->virname;
                                     newres->customdata = pt->customdata;
                                     newres->offset = (off_t)realoff;
                                     newres->next = *res;
                                     *res = newres;

                                     ptN = ptN->next_same;
                                     continue;
                                 } else {
                                     if(ctx && SCAN_ALLMATCHES) {
                                         cli_append_virus(ctx, (const char *)pt->virname);
                                         viruses_found = 1;
                                     }

                                     if (virname)
                                         *virname = pt->virname;

                                     if(customdata)
                                         *customdata = pt->customdata;

                                     if (!ctx || !SCAN_ALLMATCHES)
                                         return CL_VIRUS;

                                     ptN = ptN->next_same;
                                     continue;
                                 }
                             }
                         }
                         ptN = ptN->next_same;
                     }
                 }
                 pattN = pattN->next;
             }
         }
     }

     if (viruses_found)
         return CL_VIRUS;

     /* the detected file type is only reported when type scanning was requested */
     return (mode & AC_SCAN_FT) ? type : CL_CLEAN;
 }
fbcef1b0
 
cdd018d5
 /*
  * Sort comparator for single bytes.
  *
  * a, b - pointers to the two bytes being compared (read as unsigned char)
  *
  * Returns the difference *a - *b: negative when *a sorts first, zero when
  * equal, positive when *b sorts first.
  */
 static int qcompare_byte(const void *a, const void *b)
 {
     return *(const unsigned char *)a - *(const unsigned char *)b;
 }
 
cdd018d5
 /*
  * Sort comparator for fixed-length byte strings.
  *
  * arg  - points to a uint16_t holding the number of bytes to compare
  * a, b - each points to a pointer to the first byte of a string
  *
  * Returns the memcmp() result over the first `*arg` bytes of both strings.
  */
 static int qcompare_fstr(const void *arg, const void *a, const void *b)
 {
     const uint16_t nbytes = *(const uint16_t *)arg;
     const unsigned char *lhs = *(const unsigned char **)a;
     const unsigned char *rhs = *(const unsigned char **)b;

     return memcmp(lhs, rhs, nbytes);
 }
 
2b512658
 /*
  * Locates the ')' that closes a parenthesis opened just before `hexstr`
  * (hexstr is expected to point AFTER the opening paren).
  *
  * hexstr - NUL-terminated text to scan
  * end    - set to the first ')' seen while no inner '(' is still open, or to
  *          NULL when the string ends without one
  *
  * Returns the number of '(' characters seen before the scan stopped.
  */
 inline static size_t find_paren_end(char *hexstr, char **end)
 {
     size_t nest = 0, level = 0;
     char *p;

     *end = NULL;
     /* walk to the terminator directly rather than calling strlen() on every pass */
     for (p = hexstr; *p != '\0'; p++) {
         if (*p == '(') {
             nest++;
             level++;
         } else if (*p == ')') {
             if (!level) {
                 *end = p;
                 break;
             }
             level--;
         }
     }

     return nest;
 }
 
59506ff5
 /* Folds the length of one finished alternative into the running analysis:
  * the first length seen becomes *slen; any later length that differs clears
  * *flen and raises *slen to the larger of the two. */
 static void ac_analyze_note_len(int len, int *slen, int *flen)
 {
     if (!*slen) {
         *slen = len;
     } else if (len != *slen) {
         *flen = 0;
         if (len > *slen)
             *slen = len;
     }
 }

 /*
  * Analyzes an alternate expression up to the end of the string or up to a
  * ')' that has no matching '(' inside `hexstr` (the input may be unbalanced).
  *
  * hexstr    - NUL-terminated expression text
  * fixed_len - if non-NULL, receives 1 when every top-level alternative has
  *             the same length and the scanned text contains neither '(' nor
  *             '?', otherwise 0
  * sub_len   - if non-NULL, receives the length (in characters) of the longest
  *             top-level alternative; nested parentheses and their contents
  *             count towards the alternative that contains them
  *
  * Returns the number of top-level alternatives, i.e. 1 plus the number of
  * '|' separators found outside nested parentheses.
  */
 inline static int ac_analyze_expr(char *hexstr, int *fixed_len, int *sub_len)
 {
     const char *p;
     int level = 0, len = 0, numexpr = 1;
     int flen = 1, slen = 0;

     /* walk to the terminator directly rather than calling strlen() on every pass */
     for (p = hexstr; *p != '\0'; p++) {
         if (*p == '(') {
             flen = 0;
             level++;
         } else if (*p == ')') {
             if (!level) {
                 /* closing paren of the enclosing group: stop here */
                 ac_analyze_note_len(len, &slen, &flen);
                 break;
             }
             level--;
         }
         if (!level && *p == '|') {
             ac_analyze_note_len(len, &slen, &flen);
             len = 0;
             numexpr++;
         } else {
             if (*p == '?')
                 flen = 0;
             len++;
         }
     }
     /* account for the final alternative (a no-op repeat after the break above) */
     ac_analyze_note_len(len, &slen, &flen);

     if (sub_len)
         *sub_len = slen;
     if (fixed_len)
         *fixed_len = flen;

     return numexpr;
 }
 
590d4023
 /*
  * Compares two encoded patterns element by element over the first
  * MIN(alen, blen) entries. Each entry carries a wildcard type in its
  * CLI_MATCH_WILDCARD bits and a byte value in its low 8 bits.
  *
  * a, alen - first pattern and its length in elements
  * b, blen - second pattern and its length in elements
  * wild    - if non-NULL and the result is 0, receives a bitmask describing
  *           which side was the wilder one at some position:
  *           bit 0 (1) -> a, bit 1 (2) -> b. Left untouched on non-zero return.
  *
  * Returns 0 when no conflicting position was found in the compared prefix.
  * Returns non-zero when the patterns differ, when both sides are wilder than
  * the other somewhere (mask reaches 3), or on an unhandled wildcard type.
  */
 inline static int ac_uicmp(uint16_t *a, size_t alen, uint16_t *b, size_t blen, int *wild)
 {
     uint16_t awild, bwild, side_wild;
     size_t i, minlen = MIN(alen, blen);

     side_wild = 0;

     for (i = 0; i < minlen; i++) {
         awild = a[i] & CLI_MATCH_WILDCARD;
         bwild = b[i] & CLI_MATCH_WILDCARD;

         if (awild == bwild) {
             /* same wildcard type: compare only the bits that type constrains */
             switch (awild) {
             case CLI_MATCH_CHAR:
                 if ((a[i] & 0xff) != (b[i] & 0xff)) {
                     return (b[i] & 0xff) - (a[i] & 0xff);
                 }
                 break;
             case CLI_MATCH_IGNORE:
                 break;
             case CLI_MATCH_NIBBLE_HIGH:
                 if ((a[i] & 0xf0) != (b[i] & 0xf0)) {
                     return (b[i] & 0xf0) - (a[i] & 0xf0);
                 }
                 break;
             case CLI_MATCH_NIBBLE_LOW:
                 if ((a[i] & 0x0f) != (b[i] & 0x0f)) {
                     return (b[i] & 0x0f) - (a[i] & 0x0f);
                 }
                 break;
             default:
                 cli_errmsg("ac_uicmp: unhandled wildcard type\n");
                 return 1;
             }
         } else { /* not identical wildcard types */
             if (awild == CLI_MATCH_CHAR) { /* b is only wild */
                 switch (bwild) {
                 case CLI_MATCH_IGNORE:
                     side_wild |= 2;
                     break;
                 case CLI_MATCH_NIBBLE_HIGH:
                     if ((a[i] & 0xf0) != (b[i] & 0xf0)) {
                         return (b[i] & 0xf0) - (a[i] & 0xff);
                     }
                     side_wild |= 2;
                     break;
                 case CLI_MATCH_NIBBLE_LOW:
                     if ((a[i] & 0x0f) != (b[i] & 0x0f)) {
                         return (b[i] & 0x0f) - (a[i] & 0xff);
                     }
                     side_wild |= 2;
                     break;
                 default:
                     cli_errmsg("ac_uicmp: unhandled wildcard type\n");
                     return -1;
                 }
             } else if (bwild == CLI_MATCH_CHAR) { /* a is only wild */
                 switch (awild) {
                 case CLI_MATCH_IGNORE:
                     side_wild |= 1;
                     break;
                 case CLI_MATCH_NIBBLE_HIGH:
                     if ((a[i] & 0xf0) != (b[i] & 0xf0)) {
                         return (b[i] & 0xff) - (a[i] & 0xf0);
                     }
                     side_wild |= 1;
                     break;
                 case CLI_MATCH_NIBBLE_LOW:
                     if ((a[i] & 0x0f) != (b[i] & 0x0f)) {
                         return (b[i] & 0xff) - (a[i] & 0x0f);
                     }
                     side_wild |= 1;
                     break;
                 default:
                     cli_errmsg("ac_uicmp: unhandled wild typing\n");
                     return 1;
                 }
             } else { /* not identical, both wildcards */
                 if (awild == CLI_MATCH_IGNORE || bwild == CLI_MATCH_IGNORE) {
                     if (awild == CLI_MATCH_IGNORE) {
                         side_wild |= 1;
                     }
                     else if (bwild == CLI_MATCH_IGNORE) {
                         side_wild |= 2;
                     }
                 } else {
                     /* only high and low nibbles should be left here */
                     side_wild |= 3;
                 }
             }
         }

         /* both sides contain a wildcard that contains the other, therefore unique by wildcards */
         if (side_wild == 3)
             return 1;
     }

     if (wild)
         *wild = side_wild;
     return 0;
 }
 
59506ff5
 /* add new generic alternate node to special */
d00f762f
 inline static int ac_addspecial_add_alt_node(const char *subexpr, uint8_t sigopts, struct cli_ac_special *special, struct cli_matcher *root)
2b512658
 {
59506ff5
     struct cli_alt_node *newnode, **prev, *ins;
dda6b057
     uint16_t *s;
590d4023
     int i, cmp, wild;
59506ff5
 
     newnode = (struct cli_alt_node *)mpool_calloc(root->mempool, 1, sizeof(struct cli_alt_node));
     if (!newnode) {
9290ddf2
         cli_errmsg("ac_addspecial_add_alt_node: Can't allocate new alternate node\n");
         return CL_EMEM;
59506ff5
     }
 
dda6b057
     s = cli_mpool_hex2ui(root->mempool, subexpr);
     if (!s) {
61530d4c
         mpool_free(root->mempool, newnode);
9290ddf2
         return CL_EMALFDB;
59506ff5
     }
 
dda6b057
     newnode->str = s;
8efbf4a0
     newnode->len = (uint16_t)strlen(subexpr)/2;
590d4023
     newnode->unique = 1;
59506ff5
 
d00f762f
     /* setting nocase match */
     if (sigopts & ACPATT_OPTION_NOCASE) {
         for (i = 0; i < newnode->len; ++i)
             if ((newnode->str[i] & CLI_MATCH_METADATA) == CLI_MATCH_CHAR) {
                 newnode->str[i] = cli_nocase(newnode->str[i] & 0xff);
                 newnode->str[i] += CLI_MATCH_NOCASE;
             }
     }
 
590d4023
     /* search for uniqueness, TODO: directed acyclic word graph */
59506ff5
     prev = &((special->alt).v_str);
     ins = (special->alt).v_str;
     while (ins) {
590d4023
         cmp = ac_uicmp(ins->str, ins->len, newnode->str, newnode->len, &wild);
4ffcf308
         if (cmp == 0) {
             if (newnode->len != ins->len) { /* derivative */
590d4023
                 newnode->unique = 0;
                 ins->unique = 0;
4ffcf308
             } else if (wild == 0) { /* duplicate */
590d4023
                 mpool_free(root->mempool, newnode);
9290ddf2
                 return CL_SUCCESS;
             }
590d4023
         } /* TODO - possible sorting of altstr uniques and derivative groups? */
 
9290ddf2
         prev = &(ins->next);
         ins = ins->next;
2b512658
     }
 
59506ff5
     *prev = newnode;
     newnode->next = ins;
b7d0b832
     if ((special->num == 0) || (newnode->len < special->len[0]))
         special->len[0] = newnode->len;
     if ((special->num == 0) || (newnode->len > special->len[1]))
         special->len[1] = newnode->len;
59506ff5
     special->num++;
     return CL_SUCCESS;
 }
2b512658
 
59506ff5
 /* recursive special handler for expanding and adding generic alternates */
d00f762f
 static int ac_special_altexpand(char *hexpr, char *subexpr, uint16_t maxlen, int lvl, int maxlvl, uint8_t sigopts, struct cli_ac_special *special, struct cli_matcher *root)
59506ff5
 {
     int ret, scnt = 0, numexpr;
     char *ept, *sexpr, *end, term;
     char *fp;
 
     ept = sexpr = hexpr;
     fp = subexpr + strlen(subexpr);
 
     numexpr = ac_analyze_expr(hexpr, NULL, NULL);
 
     /* while there are expressions to resolve */
     while (scnt < numexpr) {
9290ddf2
         scnt++;
         while ((*ept != '(') && (*ept != '|') && (*ept != ')') && (*ept != '\0'))
             ept++;
 
         /* check for invalid negation */
         term = *ept;
         if ((*ept == '(') && (ept >= hexpr+1)) {
             if (ept[-1] == '!') {
                 cli_errmsg("ac_special_altexpand: Generic alternates cannot contain negations\n");
                 return CL_EMALFDB;
             }
         }
 
         /* appended token */
         *ept = 0;
         if (cli_strlcat(subexpr, sexpr, maxlen) >= maxlen) {
             cli_errmsg("ac_special_altexpand: Unexpected expression larger than expected\n");
             return CL_EMEM;
         }
 
4ffcf308
         *ept++ = term;
9290ddf2
         sexpr = ept;
 
         if (term == '|') {
             if (lvl == 0) {
d00f762f
                 if ((ret = ac_addspecial_add_alt_node(subexpr, sigopts, special, root)) != CL_SUCCESS)
9290ddf2
                     return ret;
             } else {
                 find_paren_end(ept, &end);
                 if (!end) {
                     cli_errmsg("ac_special_altexpand: Missing closing parenthesis\n");
                     return CL_EMALFDB;
                 }
                 end++;
 
d00f762f
                 if ((ret = ac_special_altexpand(end, subexpr, maxlen, lvl-1, lvl, sigopts, special, root)) != CL_SUCCESS)
9290ddf2
                     return ret;
             }
 
             *fp = 0;
         } else if (term == ')') {
             if (lvl == 0) {
                 cli_errmsg("ac_special_altexpand: Unexpected closing parenthesis\n");
                 return CL_EPARSE;
             }
 
d00f762f
             if ((ret = ac_special_altexpand(ept, subexpr, maxlen, lvl-1, lvl, sigopts, special, root)) != CL_SUCCESS)
9290ddf2
                 return ret;
             break;
         } else if (term == '(') {
             int inner, found;
             find_paren_end(ept, &end);
             if (!end) {
                 cli_errmsg("ac_special_altexpand: Missing closing parenthesis\n");
                 return CL_EMALFDB;
             }
             end++;
 
d00f762f
             if ((ret = ac_special_altexpand(ept, subexpr, maxlen, lvl+1, lvl+1, sigopts, special, root)) != CL_SUCCESS)
9290ddf2
                 return ret;
 
4ffcf308
             /* move ept to end of current alternate expression (recursive call already populates them) */
9290ddf2
             ept = end;
             inner = 0;
             found = 0;
             while (!found && *ept != '\0') {
                 switch(*ept) {
                 case '|':
                     if (!inner)
                         found = 1;
                     break;
                 case '(':
                     inner++;
                     break;
                 case ')':
                     inner--;
                     break;
                 }
                 ept++;
             }
             if (*ept == '|')
                 ept++;
 
             sexpr = ept;
             *fp = 0;
         } else if (term == '\0') {
d00f762f
             if ((ret = ac_addspecial_add_alt_node(subexpr, sigopts, special, root)) != CL_SUCCESS)
9290ddf2
                 return ret;
             break;
         }
 
         if (lvl != maxlvl)
             return CL_SUCCESS;
2b512658
     }
59506ff5
     if (scnt != numexpr) {
9290ddf2
         cli_errmsg("ac_addspecial: Mismatch in parsed and expected signature\n");
         return CL_EMALFDB;
59506ff5
     }
2b512658
 
     return CL_SUCCESS;
 }
 
59506ff5
 /* alternate string specials (so many specials!) */
d00f762f
 inline static int ac_special_altstr(const char *hexpr, uint8_t sigopts, struct cli_ac_special *special, struct cli_matcher *root)
2b512658
 {
59506ff5
     char *hexprcpy, *h, *c;
     int i, ret, num, fixed, slen, len;
 
     if (!(hexprcpy = cli_strdup(hexpr))) {
9290ddf2
         cli_errmsg("ac_special_altstr: Can't duplicate alternate expression\n");
         return CL_EDUP;
2b512658
     }
 
59506ff5
     len = strlen(hexpr);
     num = ac_analyze_expr(hexprcpy, &fixed, &slen);
2b512658
 
d00f762f
     if (!sigopts && fixed) {
9290ddf2
         special->num = 0;
b7d0b832
         special->len[0] = special->len[1] = slen / 2;
9290ddf2
         /* single-bytes are len 2 in hex */
         if (slen == 2) {
             special->type = AC_SPECIAL_ALT_CHAR;
             (special->alt).byte = (unsigned char *) mpool_malloc(root->mempool, num);
             if (!((special->alt).byte)) {
                 cli_errmsg("cli_ac_special_altstr: Can't allocate newspecial->str\n");
                 free(hexprcpy);
                 return CL_EMEM;
             }
         } else {
             special->type = AC_SPECIAL_ALT_STR_FIXED;
10225c71
             (special->alt).f_str = (unsigned char **) mpool_malloc(root->mempool, num * sizeof(unsigned char *));
9290ddf2
             if (!((special->alt).f_str)) {
                 cli_errmsg("cli_ac_special_altstr: Can't allocate newspecial->str\n");
                 free(hexprcpy);
                 return CL_EMEM;
             }
         }
 
         for (i = 0; i < num; i++) {
             if (num == 1) {
7b1f1aaf
                 c = cli_mpool_hex2str(root->mempool, hexprcpy);
9290ddf2
             } else {
                 if(!(h = cli_strtok(hexprcpy, i, "|"))) {
                     free(hexprcpy);
                     return CL_EMEM;
                 }
7b1f1aaf
                 c = cli_mpool_hex2str(root->mempool, h);
9290ddf2
                 free(h);
             }
             if (!c) {
                 free(hexprcpy);
                 return CL_EMALFDB;
             }
 
             if (special->type == AC_SPECIAL_ALT_CHAR) {
7b1f1aaf
                 (special->alt).byte[i] = (unsigned char)*c;
9290ddf2
                 mpool_free(root->mempool, c);
             } else {
7b1f1aaf
                 (special->alt).f_str[i] = (unsigned char*)c;
9290ddf2
             }
             special->num++;
         }
         /* sorting byte alternates */
         if (special->num > 1 && special->type == AC_SPECIAL_ALT_CHAR)
cdd018d5
             cli_qsort((special->alt).byte, special->num, sizeof(unsigned char), qcompare_byte);
         /* sorting str alternates */
         if (special->num > 1 && special->type == AC_SPECIAL_ALT_STR_FIXED)
             cli_qsort_r((special->alt).f_str, special->num, sizeof(unsigned char *), qcompare_fstr, &(special->len));
59506ff5
     } else { /* generic alternates */
9290ddf2
         char *subexpr;
         if (special->negative) {
             cli_errmsg("ac_special_altstr: Can't apply negation operation to generic alternate strings\n");
             free(hexprcpy);
             return CL_EMALFDB;
         }
2b512658
 
9290ddf2
         special->type = AC_SPECIAL_ALT_STR;
2b512658
 
9290ddf2
         /* allocate reusable subexpr */
         if (!(subexpr = cli_calloc(slen+1, sizeof(char)))) {
             cli_errmsg("ac_special_altstr: Can't allocate subexpr container\n");
817636eb
             free(hexprcpy);
9290ddf2
             return CL_EMEM;
         }
2b512658
 
d00f762f
         ret = ac_special_altexpand(hexprcpy, subexpr, slen+1, 0, 0, sigopts, special, root);
59506ff5
 
9290ddf2
         free(subexpr);
         free(hexprcpy);
         return ret;
2b512658
     }
 
59506ff5
     free(hexprcpy);
2b512658
     return CL_SUCCESS;
 }
 
fbcef1b0
 /* FIXME: clean up the code */
dc70379a
 int cli_ac_addsig(struct cli_matcher *root, const char *virname, const char *hexsig, uint8_t sigopts, uint32_t sigid, uint16_t parts, uint16_t partno, uint16_t rtype, uint16_t type, uint32_t mindist, uint32_t maxdist, const char *offset, const uint32_t *lsigid, unsigned int options)
fbcef1b0
 {
bc1c7469
     struct cli_ac_patt *new;
     char *pt, *pt2, *hex = NULL, *hexcpy = NULL;
     uint16_t i, j, ppos = 0, pend, *dec, nzpos = 0;
dc70379a
     uint8_t wprefix = 0, zprefix = 1, plen = 0, nzplen = 0;
d0cba11e
     struct cli_ac_special *newspecial, **newtable;
bc1c7469
     int ret, error = CL_SUCCESS;
fbcef1b0
 
 
677fc4ba
     if(!root) {
bc1c7469
         cli_errmsg("cli_ac_addsig: root == NULL\n");
         return CL_ENULLARG;
677fc4ba
     }
 
871177cd
     if(strlen(hexsig) / 2 < root->ac_mindepth) {
bc1c7469
         cli_errmsg("cli_ac_addsig: Signature for %s is too short\n", virname);
         return CL_EMALFDB;
871177cd
     }
 
47d40feb
     if((new = (struct cli_ac_patt *) mpool_calloc(root->mempool, 1, sizeof(struct cli_ac_patt))) == NULL)
bc1c7469
         return CL_EMEM;
fbcef1b0
 
6038397e
     new->rtype = rtype;
fbcef1b0
     new->type = type;
     new->sigid = sigid;
     new->parts = parts;
     new->partno = partno;
     new->mindist = mindist;
     new->maxdist = maxdist;
10290ba3
     new->customdata = NULL;
1a2906f4
     new->ch[0] |= CLI_MATCH_IGNORE;
     new->ch[1] |= CLI_MATCH_IGNORE;
677fc4ba
     if(lsigid) {
bc1c7469
         new->lsigid[0] = 1;
         memcpy(&new->lsigid[1], lsigid, 2 * sizeof(uint32_t));
677fc4ba
     }
1a2906f4
 
     if(strchr(hexsig, '[')) {
bc1c7469
         if(!(hexcpy = cli_strdup(hexsig))) {
             mpool_free(root->mempool, new);
             return CL_EMEM;
         }
1a2906f4
 
bc1c7469
         hex = hexcpy;
         for(i = 0; i < 2; i++) {
82cc35c0
             unsigned int n, n1, n2;
1a2906f4
 
bc1c7469
             if(!(pt = strchr(hex, '[')))
                 break;
1a2906f4
 
bc1c7469
             *pt++ = 0;
1a2906f4
 
bc1c7469
             if(!(pt2 = strchr(pt, ']'))) {
                 cli_dbgmsg("cli_ac_addsig: missing closing square bracket\n");
                 error = CL_EMALFDB;
                 break;
             }
1a2906f4
 
bc1c7469
             *pt2++ = 0;
1a2906f4
 
82cc35c0
             n = sscanf(pt, "%u-%u", &n1, &n2);
             if(n == 1) {
                 n2 = n1;
             } else if(n != 2) {
bc1c7469
                 cli_dbgmsg("cli_ac_addsig: incorrect range inside square brackets\n");
                 error = CL_EMALFDB;
                 break;
             }
 
             if((n1 > n2) || (n2 > AC_CH_MAXDIST)) {
                 cli_dbgmsg("cli_ac_addsig: incorrect range inside square brackets\n");
                 error = CL_EMALFDB;
                 break;
             }
 
             if(strlen(hex) == 2) {
                 if(i) {
                     error = CL_EMALFDB;
                     break;
                 }
 
                 dec = cli_hex2ui(hex);
                 if(!dec) {
                     error = CL_EMALFDB;
                     break;
                 }
 
dc70379a
                 if((sigopts & ACPATT_OPTION_NOCASE) && ((*dec & CLI_MATCH_METADATA) == CLI_MATCH_CHAR))
a1924d14
                     new->ch[i] = cli_nocase(*dec) | CLI_MATCH_NOCASE;
                 else
                     new->ch[i] = *dec;
bc1c7469
                 free(dec);
                 new->ch_mindist[i] = n1;
                 new->ch_maxdist[i] = n2;
                 hex = pt2;
             } else if(strlen(pt2) == 2) {
                 i = 1;
                 dec = cli_hex2ui(pt2);
                 if(!dec) {
                     error = CL_EMALFDB;
                     break;
                 }
 
dc70379a
                 if((sigopts & ACPATT_OPTION_NOCASE) && ((*dec & CLI_MATCH_METADATA) == CLI_MATCH_CHAR))
a1924d14
                     new->ch[i] = cli_nocase(*dec) | CLI_MATCH_NOCASE;
                 else
                     new->ch[i] = *dec;
bc1c7469
                 free(dec);
                 new->ch_mindist[i] = n1;
                 new->ch_maxdist[i] = n2;
             } else {
                 error = CL_EMALFDB;
                 break;
             }
         }
 
         if(error) {
             free(hexcpy);
             mpool_free(root->mempool, new);
             return error;
         }
 
         hex = cli_strdup(hex);
         free(hexcpy);
         if(!hex) {
             mpool_free(root->mempool, new);
             return CL_EMEM;
         }
1a2906f4
     }
fbcef1b0
 
     if(strchr(hexsig, '(')) {
9290ddf2
         char *hexnew, *start;
cc12e21d
         size_t nest;
9290ddf2
         size_t hexnewsz;
 
         if(hex) {
             hexcpy = hex;
         } else if(!(hexcpy = cli_strdup(hexsig))) {
             mpool_free(root->mempool, new);
             return CL_EMEM;
         }
 
         hexnewsz = strlen(hexsig) + 1;
         if(!(hexnew = (char *) cli_calloc(1, hexnewsz))) {
             free(new);
             free(hexcpy);
             return CL_EMEM;
         }
 
         start = pt = hexcpy;
         while((pt = strchr(start, '('))) {
             *pt++ = 0;
 
             if(!start) {
                 error = CL_EMALFDB;
                 break;
             }
             newspecial = (struct cli_ac_special *) mpool_calloc(root->mempool, 1, sizeof(struct cli_ac_special));
             if(!newspecial) {
                 cli_errmsg("cli_ac_addsig: Can't allocate newspecial\n");
                 error = CL_EMEM;
                 break;
             }
             if(pt >= hexcpy + 2) {
                 if(pt[-2] == '!') {
                     newspecial->negative = 1;
                     pt[-2] = 0;
                 }
             }
             cli_strlcat(hexnew, start, hexnewsz);
 
             nest = find_paren_end(pt, &start);
             if(!start) {
                 cli_errmsg("cli_ac_addsig: Missing closing parenthesis\n");
                 mpool_free(root->mempool, newspecial);
                 error = CL_EMALFDB;
                 break;
             }
             *start++ = 0;
             if(!strlen(pt)) {
                 cli_errmsg("cli_ac_addsig: Empty block\n");
                 mpool_free(root->mempool, newspecial);
                 error = CL_EMALFDB;
                 break;
             }
 
4ffcf308
             if (nest > ACPATT_ALTN_MAXNEST) {
                 cli_errmsg("ac_addspecial: Expression exceeds maximum alternate nesting limit\n");
0f236303
                 mpool_free(root->mempool, newspecial);
                 error = CL_EMALFDB;
                 break;
9290ddf2
             }
 
             if(!strcmp(pt, "B")) {
                 if(!*start) {
                     new->boundary |= AC_BOUNDARY_RIGHT;
                     if(newspecial->negative)
                         new->boundary |= AC_BOUNDARY_RIGHT_NEGATIVE;
                     mpool_free(root->mempool, newspecial);
                     continue;
                 } else if(pt - 1 == hexcpy) {
                     new->boundary |= AC_BOUNDARY_LEFT;
                     if(newspecial->negative)
                         new->boundary |= AC_BOUNDARY_LEFT_NEGATIVE;
                     mpool_free(root->mempool, newspecial);
                     continue;
                 }
             } else if(!strcmp(pt, "L")) {
                 if(!*start) {
                     new->boundary |= AC_LINE_MARKER_RIGHT;
                     if(newspecial->negative)
                         new->boundary |= AC_LINE_MARKER_RIGHT_NEGATIVE;
                     mpool_free(root->mempool, newspecial);
                     continue;
                 } else if(pt - 1 == hexcpy) {
                     new->boundary |= AC_LINE_MARKER_LEFT;
                     if(newspecial->negative)
                         new->boundary |= AC_LINE_MARKER_LEFT_NEGATIVE;
                     mpool_free(root->mempool, newspecial);
                     continue;
                 }
             } else if(!strcmp(pt, "W")) {
                 if(!*start) {
                     new->boundary |= AC_WORD_MARKER_RIGHT;
                     if(newspecial->negative)
                         new->boundary |= AC_WORD_MARKER_RIGHT_NEGATIVE;
                     mpool_free(root->mempool, newspecial);
                     continue;
                 } else if(pt - 1 == hexcpy) {
                     new->boundary |= AC_WORD_MARKER_LEFT;
                     if(newspecial->negative)
                         new->boundary |= AC_WORD_MARKER_LEFT_NEGATIVE;
                     mpool_free(root->mempool, newspecial);
                     continue;
                 }
             }
             cli_strlcat(hexnew, "()", hexnewsz);
             new->special++;
             newtable = (struct cli_ac_special **) mpool_realloc(root->mempool, new->special_table, new->special * sizeof(struct cli_ac_special *));
             if(!newtable) {
                 new->special--;
                 mpool_free(root->mempool, newspecial);
                 cli_errmsg("cli_ac_addsig: Can't realloc new->special_table\n");
                 error = CL_EMEM;
                 break;
             }
             newtable[new->special - 1] = newspecial;
             new->special_table = newtable;
 
             if(!strcmp(pt, "B")) {
                 newspecial->type = AC_SPECIAL_BOUNDARY;
             } else if(!strcmp(pt, "L")) {
                 newspecial->type = AC_SPECIAL_LINE_MARKER;
             } else if(!strcmp(pt, "W")) {
                 newspecial->type = AC_SPECIAL_WORD_MARKER;
             } else {
d00f762f
                 if ((ret = ac_special_altstr(pt, sigopts, newspecial, root)) != CL_SUCCESS) {
9290ddf2
                     error = ret;
                     break;
                 }
             }
         }
 
         if(start)
             cli_strlcat(hexnew, start, hexnewsz);
 
         hex = hexnew;
         free(hexcpy);
 
         if(error) {
             free(hex);
             if(new->special) {
                 mpool_ac_free_special(root->mempool, new);
             }
             mpool_free(root->mempool, new);
             return error;
         }
fbcef1b0
     }
 
47d40feb
     new->pattern = cli_mpool_hex2ui(root->mempool, hex ? hex : hexsig);
b94e66c4
     if(new->pattern == NULL) {
bc1c7469
         if(new->special)
             mpool_ac_free_special(root->mempool, new);
 
         mpool_free(root->mempool, new);
         free(hex);
         return CL_EMALFDB;
fbcef1b0
     }
b94e66c4
 
8efbf4a0
     new->length[0] = (uint16_t)strlen(hex ? hex : hexsig) / 2;
6953341f
     for(i = 0, j = 0; i < new->length[0]; i++) {
         if((new->pattern[i] & CLI_MATCH_METADATA) == CLI_MATCH_SPECIAL) {
             new->length[1] += new->special_table[j]->len[0];
             new->length[2] += new->special_table[j]->len[1];
             j++;
         } else {
             new->length[1]++;
             new->length[2]++;
         }
     }
 
1a2906f4
     free(hex);
fbcef1b0
 
dc70379a
     new->sigopts = sigopts;
68369b0f
     /* setting nocase match */
dc70379a
     if (sigopts & ACPATT_OPTION_NOCASE) {
6953341f
         for (i = 0; i < new->length[0]; i++)
9290ddf2
             if ((new->pattern[i] & CLI_MATCH_METADATA) == CLI_MATCH_CHAR) {
                 new->pattern[i] = cli_nocase(new->pattern[i] & 0xff);
                 new->pattern[i] += CLI_MATCH_NOCASE;
             }
a02acd50
     }
 
4ffcf308
     /* TODO - sigopts affect on filters? */
     if (root->filter) {
bc1c7469
         /* so that we can show meaningful messages */
         new->virname = (char*)virname;
         if (filter_add_acpatt(root->filter, new) == -1) {
             cli_warnmsg("cli_ac_addpatt: cannot use filter for trie\n");
             mpool_free(root->mempool, root->filter);
             root->filter = NULL;
         }
 
         /* TODO: should this affect maxpatlen? */
02eabc6d
     }
 
f2102544
     for(i = 0; i < root->ac_maxdepth && i < new->length[0]; i++) {
bc1c7469
         if(new->pattern[i] & CLI_MATCH_WILDCARD) {
             wprefix = 1;
             break;
         }
 
         if(zprefix && new->pattern[i])
             zprefix = 0;
fbcef1b0
     }
 
c01ff22d
     if(wprefix || zprefix) {
f2102544
         pend = new->length[0] - root->ac_mindepth + 1;
bc1c7469
         for(i = 0; i < pend; i++) {
f2102544
             for(j = i; j < i + root->ac_maxdepth && j < new->length[0]; j++) {
bc1c7469
                 if(new->pattern[j] & CLI_MATCH_WILDCARD) {
                     break;
                 } else {
                     if(j - i + 1 >= plen) {
                         plen = j - i + 1;
                         ppos = i;
                     }
                 }
 
                 if(new->pattern[ppos] || new->pattern[ppos + 1]) {
                     if(plen >= root->ac_maxdepth) {
                         break;
                     } else if(plen >= root->ac_mindepth && plen > nzplen) {
                         nzplen = plen;
                         nzpos = ppos;
                     }
                 }
             }
fbcef1b0
 
bc1c7469
             if(plen >= root->ac_maxdepth && (new->pattern[ppos] || new->pattern[ppos + 1]))
                 break;
         }
 
         if(!new->pattern[ppos] && !new->pattern[ppos + 1] && nzplen) {
             plen = nzplen;
             ppos = nzpos;
         }
 
         if(plen < root->ac_mindepth) {
             cli_errmsg("cli_ac_addsig: Can't find a static subpattern of length %u\n", root->ac_mindepth);
             mpool_ac_free_special(root->mempool, new);
             mpool_free(root->mempool, new->pattern);
             mpool_free(root->mempool, new);
             return CL_EMALFDB;
         }
fbcef1b0
 
bc1c7469
         new->prefix = new->pattern;
f2102544
         new->prefix_length[0] = ppos;
6953341f
         for(i = 0, j = 0; i < new->prefix_length[0]; i++) {
bc1c7469
             if((new->prefix[i] & CLI_MATCH_WILDCARD) == CLI_MATCH_SPECIAL)
                 new->special_pattern++;
6953341f
 
             if((new->prefix[i] & CLI_MATCH_METADATA) == CLI_MATCH_SPECIAL) {
                 new->prefix_length[1] += new->special_table[j]->len[0];
                 new->prefix_length[2] += new->special_table[j]->len[1];
                 j++;
             } else {
                 new->prefix_length[1]++;
                 new->prefix_length[2]++;
             }
         }
 
         new->pattern = &new->prefix[ppos];
         new->length[0] -= new->prefix_length[0];
         new->length[1] -= new->prefix_length[1];
         new->length[2] -= new->prefix_length[2];
fbcef1b0
     }
 
600c04f0
     if(new->length[2] + new->prefix_length[2] > root->maxpatlen)
         root->maxpatlen = new->length[2] + new->prefix_length[2];
fbcef1b0
 
bb1e844c
     new->virname = cli_mpool_virname(root->mempool, virname, options & CL_DB_OFFICIAL);
b5513f8d
     if(!new->virname) {
bc1c7469
         mpool_free(root->mempool, new->prefix ? new->prefix : new->pattern);
         mpool_ac_free_special(root->mempool, new);
         mpool_free(root->mempool, new);
         return CL_EMEM;
fbcef1b0
     }
 
677fc4ba
     if(new->lsigid[0])
bc1c7469
         root->ac_lsigtable[new->lsigid[1]]->virname = new->virname;
677fc4ba
 
294558a5
     ret = cli_caloff(offset, NULL, root->type, new->offdata, &new->offset_min, &new->offset_max);
33872a43
     if(ret != CL_SUCCESS) {
bc1c7469
         mpool_free(root->mempool, new->prefix ? new->prefix : new->pattern);
         mpool_ac_free_special(root->mempool, new);
         mpool_free(root->mempool, new->virname);
         mpool_free(root->mempool, new);
         return ret;
1a648b37
     }
 
fbcef1b0
     if((ret = cli_ac_addpatt(root, new))) {
bc1c7469
         mpool_free(root->mempool, new->prefix ? new->prefix : new->pattern);
         mpool_free(root->mempool, new->virname);
         mpool_ac_free_special(root->mempool, new);
         mpool_free(root->mempool, new);
         return ret;
fbcef1b0
     }
 
ab893605
     if(new->offdata[0] != CLI_OFF_ANY && new->offdata[0] != CLI_OFF_ABSOLUTE && new->offdata[0] != CLI_OFF_MACRO) {
bc1c7469
         root->ac_reloff = (struct cli_ac_patt **) mpool_realloc2(root->mempool, root->ac_reloff, (root->ac_reloff_num + 1) * sizeof(struct cli_ac_patt *));
         if(!root->ac_reloff) {
             cli_errmsg("cli_ac_addsig: Can't allocate memory for root->ac_reloff\n");
             return CL_EMEM;
         }
 
         root->ac_reloff[root->ac_reloff_num] = new;
         new->offset_min = root->ac_reloff_num * 2;
         new->offset_max = new->offset_min + 1;
         root->ac_reloff_num++;
33872a43
     }
 
fbcef1b0
     return CL_SUCCESS;
 }