/* * Generic text normalizer. * * Copyright (C) 2013-2019 Cisco Systems, Inc. and/or its affiliates. All rights reserved. * Copyright (C) 2008-2013 Sourcefire, Inc. * * Authors: Török Edvin * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License version 2 as * published by the Free Software Foundation. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, * MA 02110-1301, USA. */ #ifndef __TEXTNORM_H #define __TEXTNORM_H #include "fmap.h" struct text_norm_state { unsigned char *out; size_t out_len; size_t out_pos; int space_written; }; #define ASCII_FILE_BUFF_LENGTH 131072 #define MAX_ASCII_FILE_SIZE 20000000 #define MIN_3(x, y, z) ((x) < (y) ? ((x) < (z) ? (x) : (z)) : ((y) < (z) ? (y) : (z))) int text_normalize_init(struct text_norm_state *state, unsigned char *out, size_t out_len); void text_normalize_reset(struct text_norm_state *state); size_t text_normalize_buffer(struct text_norm_state *state, const unsigned char *buf, const size_t buf_len); size_t text_normalize_map(struct text_norm_state *state, fmap_t *map, size_t offset); #endif