1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
|
/*
* Copyright 2005 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
/* Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T */
/* All Rights Reserved */
/*
* Copyright (c) 1980 Regents of the University of California.
* All rights reserved. The Berkeley software License Agreement
* specifies the terms and conditions for redistribution.
*/
#pragma ident "%Z%%M% %I% %E% SMI"
#include <stdio.h>
#include <locale.h>
#include <assert.h>
extern void err();
extern int newkeys();
extern int recopy();
extern void whash();
int
main(int argc, char *argv[])
{
/*
* Make inverted file indexes. Reads a stream from mkey which
* gives record pointer items and keys. Generates set of files
* a. NHASH pointers to file b.
* b. lists of record numbers.
* c. record pointer items.
*
* these files are named xxx.ia, xxx.ib, xxx.ic;
* where xxx is taken from arg1.
* If the files exist they are updated.
*/
FILE *fa, *fb, *fc, *fta, *ftb, *ftc;
FILE *fd = NULL;
int nhash = 256;
int appflg = 1;
int keepkey = 0, pipein = 0;
char nma[100], nmb[100], nmc[100], com[100], nmd[100];
char tmpa[20], tmpb[20], tmpc[20];
char *remove = NULL;
int chatty = 0, docs, hashes, fp[2], fr, fw, pfork, pwait, status;
int i, j, k;
long keys;
int iflong = 0;
char *sortdir;
(void) setlocale(LC_ALL, "");
#if !defined(TEXT_DOMAIN)
#define TEXT_DOMAIN "SYS_TEST"
#endif
(void) textdomain(TEXT_DOMAIN);
sortdir = (access("/crp/tmp", 06) == 0) ? "/crp/tmp" : "/usr/tmp";
while (argc > 1 && argv[1][0] == '-') {
switch (argv[1][1]) {
case 'h': /* size of hash table */
nhash = atoi(argv[1]+2);
break;
case 'n': /* new, don't append */
appflg = 0;
break;
case 'a': /* append to old file */
appflg = 1;
break;
case 'v': /* verbose output */
chatty = 1;
break;
case 'd': /* keep keys on file .id for check on searching */
keepkey = 1;
break;
case 'p': /* pipe into sort (saves space, costs time) */
pipein = 1;
break;
case 'i': /* input is on file, not stdin */
close(0);
if (open(argv[2], 0) != 0)
err(gettext("Can't read input %s"), argv[2]);
if (argv[1][2] == 'u') /* unlink */
remove = argv[2];
argc--;
argv++;
break;
}
argc--;
argv++;
}
strcpy(nma, argc >= 2 ? argv[1] : "Index");
strcpy(nmb, nma);
strcpy(nmc, nma);
strcpy(nmd, nma);
strcat(nma, ".ia");
strcat(nmb, ".ib");
strcat(nmc, ".ic");
strcat(nmd, ".id");
sprintf(tmpa, "junk%di", getpid());
if (pipein) {
sprintf(com, "/usr/bin/sort -T %s -o %s", sortdir, tmpa);
fta = popen(com, "w");
} else { /* use tmp file */
fta = fopen(tmpa, "w");
assert(fta != NULL);
}
fb = 0;
if (appflg) {
if (fb = fopen(nmb, "r")) {
sprintf(tmpb, "junk%dj", getpid());
ftb = fopen(tmpb, "w");
if (ftb == NULL)
err(gettext("Can't get scratch file %s"), tmpb);
nhash = recopy(ftb, fb, fopen(nma, "r"));
fclose(ftb);
} else
appflg = 0;
}
fc = fopen(nmc, appflg ? "a" : "w");
if (keepkey)
fd = keepkey ? fopen(nmd, "w") : 0;
docs = newkeys(fta, stdin, fc, nhash, fd, &iflong);
fclose(stdin);
if (remove != NULL)
unlink(remove);
fclose(fta);
if (pipein) {
pclose(fta);
}
else
{
sprintf(com, "sort -T %s %s -o %s", sortdir, tmpa, tmpa);
system(com);
}
if (appflg) {
sprintf(tmpc, "junk%dk", getpid());
sprintf(com, "mv %s %s", tmpa, tmpc);
system(com);
sprintf(com, "sort -T %s -m %s %s -o %s", sortdir,
tmpb, tmpc, tmpa);
system(com);
}
fta = fopen(tmpa, "r");
fa = fopen(nma, "w");
fb = fopen(nmb, "w");
whash(fta, fa, fb, nhash, iflong, &keys, &hashes);
fclose(fta);
#ifndef D1
unlink(tmpa);
#endif
if (appflg) {
unlink(tmpb);
unlink(tmpc);
}
if (chatty)
printf(gettext("%ld key occurrences, %d hashes, %d docs\n"),
keys, hashes, docs);
return (0);
}
|