-
Notifications
You must be signed in to change notification settings - Fork 3
/
fa_sim_bitcomp.c
175 lines (137 loc) · 4.47 KB
/
fa_sim_bitcomp.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
//
// Copyright (c) 2015 Waystream AB
// All rights reserved.
//
// This software may be modified and distributed under the terms
// of the NetBSD license. See the LICENSE file for details.
//
// TODO: current fa_sim_bitcomp_create uses a fa_sim_t, could be independent
// fa sim using compressed transition tables. Compression is done by storing
// when there is a change of destination state in the transition table. This
// is efficient when most states have few transitions.
//
// State memory looks like this:
//
// 256 bit transition change bitmap, 1=change, 0=no change
// sizeof(*void) accepting state opaque pointer
// 32 bit * N compressed transitions
//
// Lookup of next state is done by counting number of bits left of index
// (input byte) in change bitmap. Count is then use as offset into compressed
// transition table.
// first bit in change bitmap is always zero so it is used to indicates if
// state is accepting.
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <inttypes.h>
#include "fa_sim_bitcomp.h"
#include "fa_sim.h"
#define BITFIELD64_TEST(f,b) ((f)[(b)/64] & 1ULL<<(63-((b)&63)))
#define BITFIELD64_SET(f,b) ((f)[(b)/64] |= 1ULL<<(63-((b)&63)))
// only count if node is NULL
static uint32_t fa_sim_bitcomp_table_compress(uint32_t *in,
fa_sim_bitcomp_node_t *node,
uint32_t *locs) {
uint32_t prev = in[0];
int n = 1;
int i;
// always at least one value
if (node)
node->table[0] = locs[in[0]];
// skip 0, first bit i always zero (index 0)
for (i = 1; i < 256; i++) {
if (in[i] != prev) {
if (node) {
BITFIELD64_SET(node->bitmap, i);
node->table[n] = locs[in[i]];
}
prev = in[i];
n++;
}
}
return n;
}
fa_sim_bitcomp_t *fa_sim_bitcomp_create(fa_sim_t *sim) {
uint32_t size;
uint32_t i;
uint32_t *locs;
fa_sim_bitcomp_t *fsb;
// each fa_sim_t state iteration skips state 0, it is reserved for no match
// locs it used to store offset (in 64 bit steps) to each node
locs = malloc(sizeof(locs[0]) * sim->nodes_n);
locs[0] = 0; // fa_sim_t uses 0 as not match state, map it to 0
// size of header
size = sizeof(fa_sim_bitcomp_t);
// size state 0
size += sizeof(uint64_t);
// size rest of states
for (i = 1;i < sim->nodes_n; i++) {
locs[i] = (size - sizeof(fa_sim_bitcomp_t)) / sizeof(fsb->nodes[0]);
size +=
sizeof(fa_sim_bitcomp_node_t) +
sizeof(uint32_t) *
fa_sim_bitcomp_table_compress(sim->nodes[i].table, NULL, NULL);
// 64 bit align
if (size % 8 != 0)
size += 8 - (size % 8);
}
fsb = calloc(1, size);
fsb->size = size;
// store bitmap and tables
for (i = 1;i < sim->nodes_n; i++) {
fa_sim_bitcomp_node_t *fsbn =
(fa_sim_bitcomp_node_t*)&fsb->nodes[locs[i]];
fa_sim_bitcomp_table_compress(sim->nodes[i].table, fsbn, locs);
if (sim->nodes[i].flags & FA_SIM_NODE_F_ACCEPTING) {
BITFIELD64_SET(fsbn->bitmap, 0);
fsbn->opaque = sim->nodes[i].opaque;
}
}
fsb->start = locs[sim->start];
free(locs);
return fsb;
}
void fa_sim_bitcomp_destroy(fa_sim_bitcomp_t *fsb) {
free(fsb);
}
static uint32_t popcount_bitmap(uint64_t *bitmap, uint8_t index) {
int p, l;
// 2 highest bits is number of 64 bit maps we need to popcount
l = index >> 6;
// first map only popcount bits left of index
p = __builtin_popcountll(bitmap[l] >> (63 - (index & 63)));
// popcount rest of maps using jump table
switch(l) {
case 3: p += __builtin_popcountll(bitmap[--l]);
case 2: p += __builtin_popcountll(bitmap[--l]);
case 1: p += __builtin_popcountll(bitmap[--l]);
// case 0 is nop
}
// -1 to not count accepting bit
if (BITFIELD64_TEST(bitmap, 0))
p--;
return p;
}
void fa_sim_bitcomp_run_init(fa_sim_bitcomp_t *fsb, fa_sim_run_t *fsr) {
fsr->current = fsb->start;
}
int fa_sim_bitcomp_run(fa_sim_bitcomp_t *fsb, fa_sim_run_t *fsr,
uint8_t *data, int len) {
int i;
uint32_t current = fsr->current;
fa_sim_bitcomp_node_t *node =
(fa_sim_bitcomp_node_t*)&fsb->nodes[current];
for (i = 0; i < len; i++) {
current = node->table[popcount_bitmap(node->bitmap, data[i])];
node = (fa_sim_bitcomp_node_t*)&fsb->nodes[current];
if (current == 0)
return FA_SIM_RUN_REJECT;
}
if (BITFIELD64_TEST(node->bitmap, 0)) {
fsr->opaque = node->opaque;
return FA_SIM_RUN_ACCEPT;
}
fsr->current = current;
return FA_SIM_RUN_MORE;
}