47 lines
1.5 KiB
C
47 lines
1.5 KiB
C
|
/*
|
||
|
* Generic text normalizer.
|
||
|
*
|
||
|
* Copyright (C) 2013-2022 Cisco Systems, Inc. and/or its affiliates. All rights reserved.
|
||
|
* Copyright (C) 2008-2013 Sourcefire, Inc.
|
||
|
*
|
||
|
* Authors: Török Edvin
|
||
|
*
|
||
|
* This program is free software; you can redistribute it and/or modify
|
||
|
* it under the terms of the GNU General Public License version 2 as
|
||
|
* published by the Free Software Foundation.
|
||
|
*
|
||
|
* This program is distributed in the hope that it will be useful,
|
||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
* GNU General Public License for more details.
|
||
|
*
|
||
|
* You should have received a copy of the GNU General Public License
|
||
|
* along with this program; if not, write to the Free Software
|
||
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
|
||
|
* MA 02110-1301, USA.
|
||
|
*/
|
||
|
|
||
|
#ifndef __TEXTNORM_H
|
||
|
#define __TEXTNORM_H
|
||
|
|
||
|
#include "fmap.h"
|
||
|
|
||
|
struct text_norm_state {
|
||
|
unsigned char *out;
|
||
|
size_t out_len;
|
||
|
size_t out_pos;
|
||
|
int space_written;
|
||
|
};
|
||
|
|
||
|
#define ASCII_FILE_BUFF_LENGTH 131072
|
||
|
#define MAX_ASCII_FILE_SIZE 20000000
|
||
|
|
||
|
#define MIN_3(x, y, z) ((x) < (y) ? ((x) < (z) ? (x) : (z)) : ((y) < (z) ? (y) : (z)))
|
||
|
|
||
|
int text_normalize_init(struct text_norm_state *state, unsigned char *out, size_t out_len);
|
||
|
void text_normalize_reset(struct text_norm_state *state);
|
||
|
size_t text_normalize_buffer(struct text_norm_state *state, const unsigned char *buf, const size_t buf_len);
|
||
|
size_t text_normalize_map(struct text_norm_state *state, fmap_t *map, size_t offset);
|
||
|
|
||
|
#endif
|