2 * Copyright (C) 1994, Index Data I/S
4 * Sebastian Hammer, Adam Dickmeiss
7 * Revision 1.15 1995-09-04 12:33:31 adam
8 * Various cleanup. YAZ util used instead.
10 * Revision 1.14 1994/10/04 17:46:55 adam
11 * Function options now returns arg with error option.
13 * Revision 1.13 1994/10/04 12:08:05 adam
14 * Some bug fixes and some optimizations.
16 * Revision 1.12 1994/10/03 17:23:03 adam
17 * First version of dictionary lookup with regular expressions and errors.
19 * Revision 1.11 1994/09/28 13:07:09 adam
20 * Use log_mask_str now.
22 * Revision 1.10 1994/09/26 10:17:24 adam
25 * Revision 1.9 1994/09/22 14:43:56 adam
26 * First functional version of lookup with error correction. A 'range'
27 * specifies the maximum number of insertions+deletions+substitutions.
29 * Revision 1.8 1994/09/22 10:43:44 adam
30 * Two versions of depend. Type 1 is the tail-type compatible with
31 * all make programs. Type 2 is the GNU make with include facility.
32 * Type 2 is default. depend rule chooses current rule.
34 * Revision 1.7 1994/09/19 16:34:26 adam
35 * Depend rule change. Minor changes in dicttest.c
37 * Revision 1.6 1994/09/16 15:39:12 adam
38 * Initial code of lookup - not tested yet.
40 * Revision 1.5 1994/09/06 13:05:14 adam
41 * Further development of insertion. Some special cases are
42 * not properly handled yet! assert(0) calls are put there. The
43 * binary search in each page definitely reduces user CPU time.
45 * Revision 1.4 1994/09/01 17:49:37 adam
46 * Removed stupid line. Work on insertion in dictionary. Not finished yet.
48 * Revision 1.3 1994/09/01 17:44:06 adam
49 * depend include change.
51 * Revision 1.2 1994/08/18 12:40:54 adam
52 * Some development of dictionary. Not finished at all!
54 * Revision 1.1 1994/08/16 16:26:47 adam
/* grep_handle: prints name followed by a newline on stdout.
 * main passes this function as the last argument of dict_lookup_grep.
 * The info argument is not used on the lines visible in this listing.
 * NOTE(review): only part of the body is visible here; the value
 * returned to the caller is not shown. */
71 static int grep_handle (Dict_char *name, char *info)
/* NOTE(review): "%s" assumes Dict_char is a char-compatible type -- confirm
 * against the Dict_char declaration. */
74 printf ("%s\n", name);
/* main: command-line driver that exercises the dictionary functions.
 * From the lines visible in this listing it: parses options with options(),
 * opens a resource (res_open) and a dictionary (dict_open), reads an input
 * file line by line and hands identifier-like tokens to dict_insert,
 * dict_lookup or dict_lookup_grep, greps for grep_pattern, logs counters
 * and finally calls res_close.
 * NOTE(review): this listing is incomplete -- the conditions that select
 * between these steps, several declarations and the function's return are
 * not visible here. */
78 int main (int argc, char **argv)
80 const char *name = NULL;
81 const char *inputfile = NULL;
82 const char *base = NULL;
89 char *grep_pattern = NULL;
/* Counters reported through logf near the end of main. */
91 int no_of_iterations = 0;
92 int no_of_new = 0, no_of_same = 0, no_of_change = 0;
93 int no_of_hits = 0, no_of_misses = 0;
/* Usage text written to stderr; the option letters listed here match the
 * option string given to options() below. */
99 fprintf (stderr, "usage:\n "
100 " %s [-r n] [-u] [-g pat] [-s n] [-v n] [-i f] [-w] [-c n]"
/* Option loop: runs until options() returns -2. */
105 while ((ret = options ("r:ug:s:v:i:wc:", argv, argc, &arg)) != -2)
115 logf (LOG_FATAL, "too many files specified\n");
/* NOTE(review): atoi gives no indication of a malformed number; strtol with
 * an end-pointer check would let bad input be rejected. */
143 infosize = atoi(arg);
/* The option argument is turned into a log mask by log_mask_str. */
147 log_init (log_mask_str(arg), prog, NULL);
151 logf (LOG_FATAL, "Unknown option '-%s'", arg);
157 logf (LOG_FATAL, "no base and/or dictionary specified");
/* Open the resource named by base; a null result is reported as fatal. */
160 common_resource = res_open (base);
161 if (!common_resource)
163 logf (LOG_FATAL, "cannot open resource `%s'", base);
166 dict = dict_open (name, cache, rw);
169 logf (LOG_FATAL, "dict_open fail of `%s'", name);
/* Zero the first 120 bytes of infobytes.
 * NOTE(review): 120 is a literal and the declaration of infobytes is not
 * visible here -- confirm the buffer is at least that large. */
178 memset (infobytes, 0, 120);
180 if (!(ipf = fopen(inputfile, "r")))
182 logf (LOG_FATAL|LOG_ERRNO, "cannot open %s", inputfile);
/* Read the input file in pieces of at most 1022 characters per fgets call.
 * NOTE(review): the declaration of ipf_buf is not visible here -- confirm
 * its size covers the 1023 passed to fgets. */
186 while (fgets (ipf_buf, 1023, ipf))
188 char *ipf_ptr = ipf_buf;
/* Store the decimal text of line in infobytes. */
189 sprintf (infobytes, "%d", line);
/* Walk the buffer up to the terminating NUL or the newline. */
190 for (;*ipf_ptr && *ipf_ptr != '\n';ipf_ptr++)
/* A token starts at a letter or underscore.
 * NOTE(review): isalpha/isalnum receive a plain char here; for negative char
 * values that is undefined behavior -- a cast to unsigned char avoids it. */
192 if (isalpha(*ipf_ptr) || *ipf_ptr == '_')
195 while (ipf_ptr[i] && (isalnum(ipf_ptr[i]) ||
/* Insert the token at ipf_ptr with infosize bytes taken from infobytes; the
 * result of dict_insert selects the switch case. */
202 switch(dict_insert (dict, ipf_ptr,
203 infosize, infobytes))
211 logf (LOG_LOG, "%s change\n", ipf_ptr);
215 logf (LOG_LOG, "%s duplicate\n", ipf_ptr);
/* Lookup of the same token; cp receives the result of dict_lookup. */
224 cp = dict_lookup (dict, ipf_ptr);
/* Grep lookup of the token with range as third argument; grep_handle is
 * passed as the callback argument. */
233 dict_lookup_grep (dict, ipf_ptr, range, grep_handle);
/* Grep for the pattern held in grep_pattern. */
251 logf (LOG_LOG, "Grepping '%s'", grep_pattern);
252 dict_lookup_grep (dict, grep_pattern, range, grep_handle);
/* Insertion statistics. */
256 logf (LOG_LOG, "Insertions.... %d", no_of_iterations);
257 logf (LOG_LOG, "No of new..... %d", no_of_new);
258 logf (LOG_LOG, "No of change.. %d", no_of_change);
259 logf (LOG_LOG, "No of same.... %d", no_of_same);
/* Lookup statistics; the total is taken from no_of_iterations, the same
 * counter logged under "Insertions" above. */
263 logf (LOG_LOG, "Lookups....... %d", no_of_iterations);
264 logf (LOG_LOG, "No of hits.... %d", no_of_hits);
265 logf (LOG_LOG, "No of misses.. %d", no_of_misses);
/* Close the resource opened with res_open. */
268 res_close (common_resource);