libclamav/matcher.h
e3aaff8e
 /*
e1cbc270
  *  Copyright (C) 2013-2019 Cisco Systems, Inc. and/or its affiliates. All rights reserved.
c1206103
  *  Copyright (C) 2007-2013 Sourcefire, Inc.
4addba22
  *
2023340a
  *  Authors: Tomasz Kojm
e3aaff8e
  *
  *  This program is free software; you can redistribute it and/or modify
bb34cb31
  *  it under the terms of the GNU General Public License version 2 as
  *  published by the Free Software Foundation.
e3aaff8e
  *
  *  This program is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU General Public License for more details.
  *
  *  You should have received a copy of the GNU General Public License
  *  along with this program; if not, write to the Free Software
48b7b4a7
  *  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
  *  MA 02110-1301, USA.
e3aaff8e
  */
 
 #ifndef __MATCHER_H
 #define __MATCHER_H
 
841161e0
 #include <sys/types.h>
 
e3aaff8e
 #include "clamav.h"
a85bd2ac
 #include "filetypes.h"
3c91998b
 #include "others.h"
841161e0
 #include "execs.h"
e3aaff8e
 
294558a5
 /*
  * Per-target information passed to the matcher routines declared in this
  * header (cli_targetinfo, cli_exp_eval and cli_caloff all take a pointer
  * to it).
  */
 struct cli_target_info {
     /* NOTE(review): presumably the size of the object being scanned - confirm */
     off_t fsize;
     /* Embedded by value, so the full definition of struct cli_exe_info
      * must be visible before this point. */
     struct cli_exe_info exeinfo;
     int status; /* 0 == not initialised, 1 == initialised OK, -1 == error */
 };
 
afe940da
 /*
  * Set-up / tear-down pair for a struct cli_target_info. Both take a
  * pointer to the structure and return nothing; the definitions are not
  * part of this header.
  * NOTE(review): presumably init leaves `status` at 0 ("not initialised")
  * and destroy releases whatever `exeinfo` owns - confirm in matcher.c.
  */
 void cli_targetinfo_init(struct cli_target_info *info);
 void cli_targetinfo_destroy(struct cli_target_info *info);
 
bedc58de
 #include "matcher-ac.h"
 #include "matcher-bm.h"
c802edd5
 #include "matcher-hash.h"
5fa73369
 #include "matcher-pcre.h"
1d859d1c
 #include "matcher-byte-comp.h"
5fa73369
 #include "regex_pcre.h"
048d7677
 #include "fmap.h"
b94e66c4
 #include "mpool.h"
 
27948a03
 // clang-format off
 
 /*
  * Values for the upper byte of a 16-bit quantity.
  * NOTE(review): presumably one element of a compiled signature pattern,
  * with the literal byte in the low 8 bits - confirm against matcher-ac.c.
  *
  * METADATA (0xff00) covers bits 8-15; WILDCARD (0x0f00) covers bits 8-11.
  * NOCASE (0x1000) is bit 12: inside METADATA but outside WILDCARD.
  */
 #define CLI_MATCH_METADATA    0xff00
 #define CLI_MATCH_WILDCARD    0x0f00
 #define CLI_MATCH_CHAR        0x0000
 #define CLI_MATCH_NOCASE      0x1000
 /*
  * The four values below all fall inside the WILDCARD field. They are
  * distinct field values rather than independent bits: NIBBLE_HIGH (0x0300)
  * equals IGNORE | SPECIAL, so compare the masked field for equality
  * instead of testing single bits.
  */
 #define CLI_MATCH_IGNORE      0x0100
 #define CLI_MATCH_SPECIAL     0x0200
 #define CLI_MATCH_NIBBLE_HIGH 0x0300
 #define CLI_MATCH_NIBBLE_LOW  0x0400
 
 /*
  * Sequential ids 0-5.
  * NOTE(review): presumably the value kind of a target description block
  * entry (plain integer, range, string, ...), i.e. how the data behind the
  * pointers in struct cli_lsig_tdb was parsed - confirm in readdb.c.
  */
 #define CLI_TDB_UINT        0
 #define CLI_TDB_RANGE       1
 #define CLI_TDB_STR         2
 #define CLI_TDB_RANGE2      3
 #define CLI_TDB_FTYPE       4
 #define CLI_TDB_FTYPE_EXPR  5
bedc58de
 
677fc4ba
 /*
  * Target description block of a logical signature; embedded by value in
  * struct cli_ac_lsig as its `tdb` member.
  */
 struct cli_lsig_tdb {
27948a03
     /* NOTE(review): presumably backing storage for integer, range and
      * string attributes, with cnt[] holding the three element counts -
      * confirm against the loader. */
     uint32_t       *val, *range;
     char           *str;
     uint32_t       cnt[3];
     uint32_t       subsigs;
677fc4ba
 
     /* Read-only attribute pointers.
      * NOTE(review): presumably NULL when the attribute is absent and
      * otherwise pointing into val/range above - confirm. */
     const uint32_t *target;
17cfd76f
     const uint32_t *engine, *nos, *ep, *filesize;
7770d314
     const uint32_t *container, *handlertype;
87b2a1a9
     const uint32_t *intermediates;
0f7ba617
     /*
677fc4ba
     const uint32_t *sectoff, *sectrva, *sectvsz, *sectraw, *sectrsz,
27948a03
                    *secturva, *sectuvsz, *secturaw, *sectursz;
0f7ba617
     */
27948a03
     const char     *icongrp1, *icongrp2;
     uint32_t       *macro_ptids;
0d9dbdef
     /* Member exists only when USE_MPOOL is defined, so the structure size
      * depends on that build setting. */
 #ifdef USE_MPOOL
27948a03
     mpool_t        *mempool;
0d9dbdef
 #endif
677fc4ba
 };
 
27948a03
 // clang-format on
 
7665e02d
 /* Bit 0 of a flags byte.
  * NOTE(review): presumably tested against the `flag` member of
  * struct cli_ac_lsig - confirm. */
 #define CLI_LSIG_FLAG_PRIVATE 0x01
 
459b13ed
 /* Forward declaration only; the type is not defined in this header. */
 struct cli_bc;
677fc4ba
 /*
  * One logical signature entry; struct cli_matcher keeps an array of
  * pointers to these in `ac_lsigtable`.
  */
 struct cli_ac_lsig {
b7999b89
     /* These macros are defined inside the struct body but, like every
      * preprocessor macro, are visible file-wide from here on.
      * NOTE(review): presumably the values stored in `type` below. */
 #define CLI_LSIG_NORMAL 0
 #define CLI_YARA_NORMAL 1
 #define CLI_YARA_OFFSET 2
677fc4ba
     uint32_t id;
2545f976
     unsigned bc_idx;
b5b3fecd
     uint8_t type;
7665e02d
     uint8_t flag;
b5b3fecd
     /* The two members share storage.
      * NOTE(review): presumably `type` decides which one is live - confirm. */
     union {
         char *logic;
f51f42e9
         uint8_t *code_start;
b5b3fecd
     } u;
677fc4ba
     const char *virname;
     struct cli_lsig_tdb tdb;
 };
 
bedc58de
 /*
  * Aggregate state for one matcher root. It groups the tables used by the
  * Boyer-Moore, hash, Aho-Corasick, PCRE and byte-compare sub-matchers.
  *
  * The layout is build-dependent: the PCRE members exist only when
  * HAVE_PCRE evaluates non-zero and `mempool` only when USE_MPOOL is
  * defined, so every translation unit including this header must be built
  * with the same settings.
  */
 struct cli_matcher {
33872a43
     unsigned int type;
 
bedc58de
     /* Extended Boyer-Moore */
ab1db3b3
     uint8_t *bm_shift;
006f5fe6
     struct cli_bm_patt **bm_suffix, **bm_pattab;
0a3d4094
     /* Note the mixed declarators: soff is a pointer, soff_len a plain
      * uint32_t. */
     uint32_t *soff, soff_len; /* for PE section sigs */
006f5fe6
     uint32_t bm_offmode, bm_patterns, bm_reloff_num, bm_absoff_num;
bedc58de
 
3faa9783
     /* HASH */
c802edd5
     struct cli_hash_patt hm;
e37613ad
     struct cli_hash_wild hwild;
c802edd5
 
bedc58de
     /* Extended Aho-Corasick */
3e265c46
     uint32_t ac_partsigs, ac_nodes, ac_lists, ac_patterns, ac_lsigs;
677fc4ba
     struct cli_ac_lsig **ac_lsigtable;
bedc58de
     struct cli_ac_node *ac_root, **ac_nodetable;
3e265c46
     struct cli_ac_list **ac_listtable;
fbcef1b0
     struct cli_ac_patt **ac_pattable;
33872a43
     struct cli_ac_patt **ac_reloff;
aca9ea82
     uint32_t ac_reloff_num, ac_absoff_num;
b5231f5f
     uint8_t ac_mindepth, ac_maxdepth;
02eabc6d
     struct filter *filter;
b5231f5f
 
     uint16_t maxpatlen;
23d7c6e6
     uint8_t ac_only;
5fa73369
 
     /* Perl-Compiled Regular Expressions */
7afaa9bd
 #if HAVE_PCRE
35a05ff8
     uint32_t pcre_metas;
     struct cli_pcre_meta **pcre_metatable;
7ab4eec7
     uint32_t pcre_reloff_num, pcre_absoff_num;
7afaa9bd
 #endif
5fa73369
 
9cb3e8eb
     /* Byte Compare */
     uint32_t bcomp_metas;
     struct cli_bcomp_meta **bcomp_metatable;
 
984f90ca
     /* Bytecode Tracker */
     uint32_t linked_bcs;
 
0728972e
 #ifdef USE_MPOOL
47d40feb
     mpool_t *mempool;
0728972e
 #endif
bedc58de
 };
 
288057e9
 /*
  * One container-metadata signature. Entries form a singly linked list
  * through `next`.
  * NOTE(review): fsizec, fsizer and filepos are two-element arrays like
  * csize, so presumably also (min, max) pairs - confirm against the
  * loader.
  */
 struct cli_cdb {
     char *virname;           /* virus name */
     cli_file_t ctype;        /* container type */
     regex_t name;            /* filename regex */
     size_t csize[2];         /* container size (min, max); if csize[0] != csize[1]
d0cba11e
                               * then value of 0 makes the field ignored
                               */
288057e9
     size_t fsizec[2];        /* file size in container */
     size_t fsizer[2];        /* real file size */
     int encrypted;           /* file is encrypted; 2 == ignore */
     unsigned int filepos[2]; /* file position in container */
     int res1;                /* reserved / format specific */
     void *res2;              /* reserved / format specific */
55094a9c
 
     struct cli_cdb *next;    /* next entry in the list */
 };
 
2c0fa85f
 #define CLI_MAX_TARGETS 2 /* maximum filetypes for a specific target */
4addba22
 /*
  * Description of one matcher target: the file type(s) it applies to, a
  * display name and per-target settings. The cli_mtargets table is built
  * from these, with initialisers given positionally in member order.
  */
 struct cli_mtarget {
2c0fa85f
     cli_file_t target[CLI_MAX_TARGETS]; /* file types served by this target */
4addba22
     const char *name;
288057e9
     uint8_t idx; /* idx of matcher */
4addba22
     uint8_t ac_only;
02eabc6d
     uint8_t enable_prefiltering;
2c0fa85f
     uint8_t target_count; /* must be synced with non-zero values in the target array */
4addba22
 };
 
27948a03
 // clang-format off
 
e7b3198d
 /* Number of rows in cli_mtargets; must equal the initialiser count below. */
 #define CLI_MTARGETS 15
4addba22
 /*
  * Table of matcher targets. Columns follow the member order of
  * struct cli_mtarget:
  *   { target[0], target[1] }, name, idx, ac_only, enable_prefiltering,
  *   target_count
  *
  * In every row `idx` equals the row's position in the array. MACH-O is
  * the only row that lists two file types (target_count 2).
  *
  * Because the table is `static const` in a header, each translation unit
  * that includes this file gets its own private copy.
  *
  * NOTE(review): GENERIC lists { 0, 0 } yet has target_count 1, which does
  * not match the "non-zero values" rule stated on target_count; presumably
  * 0 is a meaningful cli_file_t here - confirm against filetypes.h.
  */
 static const struct cli_mtarget cli_mtargets[CLI_MTARGETS] =  {
2c0fa85f
     { {0, 0},                                   "GENERIC",      0,  0, 1, 1 },
     { {CL_TYPE_MSEXE, 0},                       "PE",           1,  0, 1, 1 },
     { {CL_TYPE_MSOLE2, 0},                      "OLE2",         2,  1, 0, 1 },
     { {CL_TYPE_HTML, 0},                        "HTML",         3,  1, 0, 1 },
     { {CL_TYPE_MAIL, 0},                        "MAIL",         4,  1, 1, 1 },
     { {CL_TYPE_GRAPHICS, 0},                    "GRAPHICS",     5,  1, 0, 1 },
     { {CL_TYPE_ELF, 0},                         "ELF",          6,  1, 0, 1 },
     { {CL_TYPE_TEXT_ASCII, 0},                  "ASCII",        7,  1, 1, 1 },
     { {CL_TYPE_ERROR, 0},                       "NOT USED",     8,  1, 0, 1 },
     { {CL_TYPE_MACHO, CL_TYPE_MACHO_UNIBIN},    "MACH-O",       9,  1, 0, 2 },
     { {CL_TYPE_PDF, 0},                         "PDF",         10,  1, 0, 1 },
     { {CL_TYPE_SWF, 0},                         "FLASH",       11,  1, 0, 1 },
de46d3e3
     { {CL_TYPE_JAVA, 0},                        "JAVA",        12,  1, 0, 1 },
e7b3198d
     { {CL_TYPE_INTERNAL, 0},                    "INTERNAL",    13,  1, 0, 1 },
     { {CL_TYPE_OTHER, 0},                       "OTHER",       14,  1, 0, 1 }
4addba22
 };
b68d11d2
 
33872a43
 /*
  * Offset-type codes. ANY and NONE take the two largest 32-bit values; the
  * remaining codes are small sequential ids (1-9).
  * NOTE(review): presumably these are what cli_caloff() stores in its
  * `offdata` output to describe how a signature offset is anchored
  * (absolute, relative to end of file, entry point, section, ...) -
  * confirm in matcher.c.
  */
 #define CLI_OFF_ANY         0xffffffff
27948a03
 #define CLI_OFF_NONE        0xfffffffe
33872a43
 #define CLI_OFF_ABSOLUTE    1
 #define CLI_OFF_EOF_MINUS   2
 #define CLI_OFF_EP_PLUS     3
 #define CLI_OFF_EP_MINUS    4
 #define CLI_OFF_SL_PLUS     5
 #define CLI_OFF_SX_PLUS     6
d2ba6f98
 #define CLI_OFF_VERSION     7
ab893605
 #define CLI_OFF_MACRO       8
27948a03
 #define CLI_OFF_SE          9
 
 // clang-format on
33872a43
 
102cd430
 /*
  * Buffer-scanning entry point; returns a cl_error_t status.
  * NOTE(review): going by the parameter names, this presumably scans
  * `length` bytes at `buffer`, which sit at `offset` within the scanned
  * object, against the signatures for `ftype`, with `acdata` optionally
  * supplying Aho-Corasick state - confirm in matcher.c.
  */
 cl_error_t cli_scanbuff(const unsigned char *buffer, uint32_t length, uint32_t offset, cli_ctx *ctx, cli_file_t ftype, struct cli_ac_data **acdata);
5612732c
 
102cd430
 /*
  * Scanning and signature-evaluation entry points; each returns a
  * cl_error_t status. The definitions are not part of this header.
  *
  * cli_scandesc and cli_fmap_scandesc take the same arguments except that
  * the former receives a descriptor `desc` and the latter an extra
  * `refhash` buffer.
  * NOTE(review): presumably the fmap variant scans the map already
  * attached to `ctx` - confirm.
  *
  * cli_exp_eval takes a matcher root plus Aho-Corasick data and target
  * info.
  * NOTE(review): presumably it evaluates the logical signatures in
  * `root->ac_lsigtable` - confirm.
  *
  * cli_caloff takes an offset string and writes through `offdata`,
  * `offset_min` and `offset_max`; `info` is read-only (const).
  * NOTE(review): presumably the CLI_OFF_* codes describe its output -
  * confirm.
  */
 cl_error_t cli_scandesc(int desc, cli_ctx *ctx, cli_file_t ftype, uint8_t ftonly, struct cli_matched_type **ftoffset, unsigned int acmode, struct cli_ac_result **acres);
 cl_error_t cli_fmap_scandesc(cli_ctx *ctx, cli_file_t ftype, uint8_t ftonly, struct cli_matched_type **ftoffset, unsigned int acmode, struct cli_ac_result **acres, unsigned char *refhash);
 cl_error_t cli_exp_eval(cli_ctx *ctx, struct cli_matcher *root, struct cli_ac_data *acdata, struct cli_target_info *target_info, const char *hash);
 cl_error_t cli_caloff(const char *offstr, const struct cli_target_info *info, unsigned int target, uint32_t *offdata, uint32_t *offset_min, uint32_t *offset_max);
53721687
 
102cd430
 /*
  * Checks keyed on a digest and a size; each returns a cl_error_t status.
  * cli_checkfp_virus additionally takes a name string `vname`.
  * NOTE(review): "fp" presumably stands for false positive, i.e. a lookup
  * of the digest in an allow list - confirm in matcher.c. `digest` is not
  * const-qualified, so callers should not assume it is left unmodified
  * without checking the definition.
  */
 cl_error_t cli_checkfp(unsigned char *digest, size_t size, cli_ctx *ctx);
 cl_error_t cli_checkfp_virus(unsigned char *digest, size_t size, cli_ctx *ctx, const char *vname);
e4101980
 
102cd430
 /*
  * Takes the metadata of one file inside a container; returns a
  * cl_error_t status. The parameters mirror the members of struct cli_cdb
  * (name, fsizec, fsizer, encrypted, filepos, res1, res2), here as single
  * values where the struct holds two-element arrays.
  * NOTE(review): presumably each value is matched against the
  * corresponding range of every cli_cdb entry - confirm in matcher.c.
  */
 cl_error_t cli_matchmeta(cli_ctx *ctx, const char *fname, size_t fsizec, size_t fsizer, int encrypted, unsigned int filepos, int res1, void *res2);
55094a9c
 
c1206103
 /*
  * Takes a target info structure, a target number and a file map; returns
  * nothing.
  * NOTE(review): presumably it fills `info` from `map` for the given
  * `target` and reports the outcome through `info->status` (documented as
  * 0 / 1 / -1 on the struct) - confirm in matcher.c.
  */
 void cli_targetinfo(struct cli_target_info *info, unsigned int target, fmap_t *map);
 
e3aaff8e
 #endif