/* blob: 37aa98ac423bf636332d87174cf84c6686c46812 (plain) */
/*
** Case-sensitive Boyer-Moore-Horspool pattern match
**
** public domain by Raymond Gardner 7/92
**
** limitation: pattern length + string length must be less than 32767
**
** 10/21/93 rdg Fixed bug found by Jeff Dunlop
*/
#include <limits.h> /* rdg 10/93 */
#include <stddef.h>
#include <string.h>
typedef unsigned char uchar;

/*
** Sentinel shift stored in skip[] for the pattern's final character.
** Adding it to any negative text offset yields a non-negative value,
** which is what terminates the inner scan loop in bmh_search().
** INT_MAX is used so that the only size restriction is that
** pattern length + string length must not exceed INT_MAX.
*/
#define LARGE INT_MAX

static int patlen;                  /* length of the current pattern       */
static int skip[UCHAR_MAX+1];       /* per-byte shift table   rdg 10/93    */
static int skip2;                   /* shift applied after a failed verify */
static const uchar *pat;            /* current pattern (caller's storage)  */

/*
** bmh_init() - prepare the shift tables for a new pattern.
**
** pattern: NUL-terminated pattern to search for. Only the pointer is
**          stored, so the caller's buffer must stay valid and unchanged
**          for as long as bmh_search() is used with it. A NULL pattern
**          is treated as the empty pattern.
**
** Must be called before bmh_search(); the state is file-scope, so only
** one pattern is active at a time.
*/
void bmh_init(const char *pattern)
{
    int i, lastpatchar;

    if (pattern == NULL)
        pattern = "";
    pat = (const uchar *)pattern;
    patlen = (int)strlen(pattern);

    /* Bytes that do not occur in the pattern shift by its full length. */
    for (i = 0; i <= UCHAR_MAX; ++i)                /* rdg 10/93 */
        skip[i] = patlen;
    skip2 = patlen;          /* Horspool's fixed second shift */

    /* Empty pattern: there is no last character to index. */
    if (patlen == 0)
        return;

    /* Bytes in the pattern shift by their distance from its end. */
    for (i = 0; i < patlen; ++i)
        skip[pat[i]] = patlen - i - 1;

    /* The final character gets the sentinel instead of a zero shift. */
    lastpatchar = pat[patlen - 1];
    skip[lastpatchar] = LARGE;

    /*
    ** skip2 is the distance from the end of the pattern to the
    ** rightmost earlier occurrence of its final character.
    */
    for (i = 0; i < patlen - 1; ++i)
    {
        if (pat[i] == lastpatchar)
            skip2 = patlen - i - 1;
    }
}

/*
** bmh_search() - find the first occurrence of the current pattern.
**
** string:    text to search; it need not be NUL-terminated.
** stringlen: number of bytes of text to examine.
**
** Returns a pointer to the first match inside string, or NULL when
** there is none (or when stringlen is negative). An empty pattern,
** including the state before any bmh_init() call, matches at the
** start of the text, as strstr() does.
*/
char *bmh_search(const char *string, const int stringlen)
{
    const uchar *end;       /* one past the last byte of the text */
    const uchar *s;         /* candidate match position           */
    int i, j;

    if (stringlen < 0)
        return NULL;
    if (patlen == 0)
        return (char *)string;

    /* i is a negative offset from the end of the text. */
    i = patlen - 1 - stringlen;
    if (i >= 0)
        return NULL;        /* pattern is longer than the text */

    /* Index bytes as unsigned so values >= 0x80 compare correctly. */
    end = (const uchar *)string + stringlen;
    for ( ;; )
    {
        /*
        ** Advance until i becomes non-negative: either the scan ran
        ** off the end of the text, or the pattern's final character
        ** was seen and LARGE was added.
        */
        while ( (i += skip[end[i]]) < 0 )
            ;                           /* mighty fast inner loop */
        if (i < (LARGE - stringlen))
            return NULL;                /* ran off the end: no match */
        i -= LARGE;                     /* undo the sentinel */

        /* Final character matched; verify the rest right to left. */
        j = patlen - 1;
        s = end + (i - j);
        while (--j >= 0 && s[j] == pat[j])
            ;
        if ( j < 0 )                                    /* rdg 10/93 */
            return (char *)s;                           /* rdg 10/93 */
        if ( (i += skip2) >= 0 )                        /* rdg 10/93 */
            return NULL;                                /* rdg 10/93 */
    }
}
|