blob: f555fb5e8daaf911d9e70ee6c8957435b82db63c (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
|
/* This file is part of the software similarity tester SIM.
Written by Dick Grune, Vrije Universiteit, Amsterdam.
$Id: idf.c,v 2.8 2005/02/20 17:03:00 dick Exp $
*/
#include <string.h>
#include "system.par"
#include "token.h"
#include "idf.h"
/*
	Looks up the string str in the table list[] by binary search and
	returns the id_tr field of the matching entry, or dflt when no entry
	has an id_tag equal to str.

	str		the NUL-terminated string to look up
	list		the table to search; the search compares with strcmp(),
			so the entries must be sorted in ascending strcmp()
			order of their id_tag fields
	listsize	the size of the table in bytes (it is divided by
			sizeof (struct idf) to obtain the number of entries)
	dflt		the value returned when str is not found

	An empty table (listsize smaller than one entry) yields dflt; no
	entry is inspected in that case.
*/
TOKEN
idf_in_list(
	const char *str,
	const struct idf list[],
	unsigned int listsize,
	TOKEN dflt
) {
	int count = (int) (listsize / sizeof (struct idf));
	int first;
	int last;

	if (count <= 0) {
		/* nothing to search; list[0] does not exist */
		return dflt;
	}

	first = 0;
	last = count - 1;
	/*	Invariant: if str is present at all, it is in list[first..last].
		The loop narrows the range down to a single candidate.
	*/
	while (first < last) {
		/* written this way so the sum cannot overflow */
		int middle = first + (last - first) / 2;

		if (strcmp(str, list[middle].id_tag) > 0) {
			/* str sorts after list[middle]: discard the lower half */
			first = middle + 1;
		}
		else {
			/* str sorts at or before list[middle]: keep middle */
			last = middle;
		}
	}

	/* first == last: the only entry that can still match */
	if (strcmp(str, list[first].id_tag) == 0) {
		return list[first].id_tr;
	}
	return dflt;
}
TOKEN
idf_hashed(const char *str) {
register int32 h = 0;
/* let's be careful about ranges; if done wrong it's hard to debug */
while (*str) {
/* -1 <= h <= 2^31-1 */
h = (h << 1) + (*str++&0377);
/* -2^31 <= h <= 2^31-1 */
if (h < 0) {
/* -2^31 <= h <= -1 */
h += 2147483647; /* 2^31-1 */
/* -1 <= h <= 2^31-2 */
}
else {
/* 0 <= h <= 2^31-1 */
}
/* -1 <= h <= 2^31-1 */
}
/* -1 <= h <= 2^31-1 */
if (h < 0) {
/* h = -1 */
/* a very small chance, but all the same */
h = 0;
}
/* 0 <= h <= 2^31-1 */
h %= 253; /* 0 <= h < 253 */
return NORM(h + 1); /* 1 <= h < 254 */
/* this avoids SKIP (0) and EOL (255) */
}
|