2 * Copyright (C) 1994-1995, Index Data I/S
4 * Sebastian Hammer, Adam Dickmeiss
7 * Revision 1.9 1995-09-27 12:22:28 adam
8 * More work on extract in record control.
9 * Field name is not in isam keys but in prefix in dictionary words.
11 * Revision 1.8 1995/09/14 07:48:22 adam
12 * Record control management.
14 * Revision 1.7 1995/09/11 13:09:32 adam
15 * More work on relevance feedback.
17 * Revision 1.6 1995/09/08 14:52:27 adam
18 * Minor changes. Dictionary is lower case now.
20 * Revision 1.5 1995/09/06 16:11:16 adam
21 * Option: only one word key per file.
23 * Revision 1.4 1995/09/05 15:28:39 adam
24 * More work on search engine.
26 * Revision 1.3 1995/09/04 12:33:41 adam
27 * Various cleanup. YAZ util used instead.
29 * Revision 1.2 1995/09/04 09:10:34 adam
30 * More work on index add/del/update.
31 * Merge sort implemented.
32 * Initial work on z39 server.
34 * Revision 1.1 1995/09/01 14:06:35 adam
35 * Split of work into more files.
/* Next system number (SYSNO) to assign to a file that is not yet in the
 * file dictionary.  key_open loads it from the "." dictionary entry and
 * file_extract post-increments it for each newly registered file. */
49 static SYSNO sysno_next;
/* Descriptor returned by open() for the key file in key_open; starts
 * out as -1. */
50 static int key_fd = -1;
/* Descriptor returned by open() for FNAME_SYS_IDX in key_open; starts
 * out as -1. */
51 static int sys_idx_fd = -1;
/* key_offset: number of bytes currently used in key_buf (the next write
 * position).  key_buf_size: the size handed to xmalloc for key_buf. */
53 static int key_offset, key_buf_size;
/*
 * key_open: open the key file and the file-index structures.
 *
 * fname names the key file; it is opened read/write and created if it
 * does not exist.
 *
 * NOTE(review): only part of this function is visible in this view (the
 * braces, local declarations and the statements that follow each failed
 * check are missing), so the comments below describe the visible calls
 * only.
 */
57 void key_open (const char *fname)
/* Open (or create, mode 0666) the key file; -1 means open() failed. */
62 if ((key_fd = open (fname, O_RDWR|O_CREAT, 0666)) == -1)
/* Report the failure at fatal level together with errno. */
64 logf (LOG_FATAL|LOG_ERRNO, "open %s", fname);
67 logf (LOG_DEBUG, "key_open of %s", fname);
/* Allocate the in-memory key buffer that wordAdd appends to and
 * wordFlush writes out. */
69 key_buf = xmalloc (key_buf_size);
/* Open the file dictionary.  NOTE(review): the meaning of the arguments
 * 40 and 1 is defined by dict_open and is not visible here. */
71 if (!(file_idx = dict_open (FNAME_FILE_DICT, 40, 1)))
/* NOTE(review): the message prints the literal "fileidx" rather than
 * FNAME_FILE_DICT -- confirm the two agree. */
73 logf (LOG_FATAL, "dict_open fail of %s", "fileidx");
/* The "." entry carries the persisted sysno_next counter; the same key
 * is written back with dict_insert later in this file. */
76 file_key = dict_lookup (file_idx, ".");
/* Restore the counter, skipping the first byte of the entry (presumably
 * a length byte -- TODO confirm against dict_lookup).  NOTE(review): any
 * NULL check on file_key is not visible in this view. */
78 memcpy (&sysno_next, (char*)file_key+1, sizeof(sysno_next));
/* Open (or create, mode 0666) the system index file that file_extract
 * writes to. */
81 if ((sys_idx_fd = open (FNAME_SYS_IDX, O_RDWR|O_CREAT, 0666)) == -1)
83 logf (LOG_FATAL|LOG_ERRNO, "open %s", FNAME_SYS_IDX);
/* NOTE(review): fragment of a shutdown routine whose header is not
 * visible in this view (presumably key_close, judging by the log
 * message below). */
/* Logged on a path whose condition is not visible here. */
92 logf (LOG_DEBUG, "key_close - but no file");
/* Persist the sysno_next counter under the "." key; key_open looks the
 * same key up to restore it. */
97 dict_insert (file_idx, ".", sizeof(sysno_next), &sysno_next);
98 dict_close (file_idx);
/*
 * wordFlush: write the bytes accumulated in key_buf to the key file.
 *
 * NOTE(review): how the sysno parameter is used is not visible in this
 * view, nor are the local declarations or the reset of key_offset.
 */
104 void wordFlush (int sysno)
/* Loop until all key_offset bytes have been handed to write(). */
111 while (i < key_offset)
/* Ask for the remainder starting at offset i.  The update of i from w
 * is not visible here -- presumably i advances by w so that short
 * writes are retried; TODO confirm. */
113 w = write (key_fd, key_buf + i, key_offset - i);
/* Fatal log with errno on the write-failure path (the test itself is
 * not visible here). */
116 logf (LOG_FATAL|LOG_ERRNO, "Write key fail");
/*
 * wordInit: initialise a RecWord; installed as the extract control's
 * init callback in file_extract.
 *
 * NOTE(review): only one assignment is visible in this view; other
 * fields may be initialised on lines that are not shown.
 */
124 static void wordInit (RecWord *p)
/* Mark the word as a string value; wordAdd reads p->u.string. */
128 p->which = Word_String;
/*
 * wordAdd: append one extracted word to key_buf; installed as the
 * extract control's add callback in file_extract.
 *
 * The bytes appended per word, in order, as far as this view shows:
 *   1. a prefix formatted as "%c%04d" from p->attrSet + '0' and
 *      p->attrUse,
 *   2. the characters of p->u.string, each passed through
 *      index_char_cvt, followed by a terminating '\0',
 *   3. one byte that is 1 when key_cmd is 'a' and 0 otherwise,
 *   4. a raw copy of a key structure holding key_sysno and p->seqno.
 *
 * NOTE(review): local declarations, braces and several statements are
 * not visible in this view; comments describe the visible lines only.
 */
131 static void wordAdd (const RecWord *p)
/* Grow the buffer when fewer than 1000 bytes of headroom remain.
 * NOTE(review): this assumes a single entry never needs more than 1000
 * bytes; no per-word length check is visible here. */
138 if (key_offset + 1000 > key_buf_size)
/* Allocate a buffer twice the current size and carry over the bytes
 * already in use.  The release of the old buffer and the update of
 * key_buf_size are not visible in this view. */
143 new_key_buf = xmalloc (2*key_buf_size);
144 memcpy (new_key_buf, key_buf, key_offset);
146 key_buf = new_key_buf;
/* Build the attribute prefix.  NOTE(review): the size of wordPrefix is
 * not visible; "%04d" is a minimum width, so a large attrUse produces
 * more than four digits -- confirm the buffer is big enough. */
148 sprintf (wordPrefix, "%c%04d", p->attrSet + '0', p->attrUse);
/* strcpy also stores a '\0', but key_offset advances by strlen only, so
 * the first word character overwrites that terminator. */
149 strcpy (key_buf + key_offset, wordPrefix);
150 key_offset += strlen (wordPrefix);
/* Append the word one character at a time through index_char_cvt. */
154 for (i = 0; p->u.string[i]; i++)
155 key_buf[key_offset++] = index_char_cvt (p->u.string[i]);
/* Terminate the prefix+word string. */
156 key_buf[key_offset++] = '\0';
/* Command flag: 1 when key_cmd is 'a', 0 for anything else. */
161 x = (key_cmd == 'a') ? 1 : 0;
/* Store one byte of x.  NOTE(review): the declaration of x and the
 * matching advance of key_offset are not visible here; if x is wider
 * than one byte, which byte gets copied depends on byte order. */
162 memcpy (key_buf + key_offset, &x, 1);
/* Fill in the key for this occurrence and append it as raw bytes
 * (memcpy is used, so no alignment is required of key_buf). */
165 key.sysno = key_sysno;
166 key.seqno = p->seqno;
167 memcpy (key_buf + key_offset, &key, sizeof(key));
168 key_offset += sizeof(key);
/*
 * file_extract: run the record extractor for one file.
 *
 * cmd   - command character; in the visible lines it is only logged.
 *         (Presumably it also sets key_cmd, which wordAdd tests against
 *         'a' -- TODO confirm; that assignment is not visible here.)
 * fname - path of the file to read; its extension selects the file type.
 * kname - key under which the file is registered in the file dictionary
 *         and stored in the system index file.
 *
 * NOTE(review): braces, local declarations, branch conditions and the
 * statements on the failure paths are not visible in this view, so the
 * comments below describe the visible calls only.
 */
171 void file_extract (int cmd, const char *fname, const char *kname)
177 const char *file_type;
180 struct recExtractCtrl extractCtrl;
183 logf (LOG_DEBUG, "%c %s k=%s", cmd, fname, kname);
/* Scan fname from its last character backwards looking for the
 * extension separator.  An earlier branch of this if/else chain is not
 * visible here. */
184 for (i = strlen(fname); --i >= 0; )
190 else if (fname[i] == '.')
/* Copy everything after the '.' into ext.  NOTE(review): the size of
 * ext is not visible and the copy is unbounded -- confirm. */
192 strcpy (ext, fname+i+1);
/* Map the extension to a file type through the resource named
 * "fileExtension.<ext>".  NOTE(review): the size of ext_res is not
 * visible and sprintf is unbounded -- confirm. */
195 sprintf (ext_res, "fileExtension.%s", ext);
196 if (!(file_type = res_get (common_resource, ext_res)))
/* Look up whether this key is already registered. */
199 file_info = dict_lookup (file_idx, kname);
/* Register a new file: take the next system number, record
 * kname -> sysno in the dictionary, and store kname in the system index
 * file at offset sysno * SYS_IDX_ENTRY_LEN.  (The condition selecting
 * this path is not visible here -- presumably file_info is NULL.) */
202 sysno = sysno_next++;
203 dict_insert (file_idx, kname, sizeof(sysno), &sysno);
/* NOTE(review): the results of lseek and write are ignored, and no
 * check that strlen(kname)+1 fits in SYS_IDX_ENTRY_LEN is visible. */
204 lseek (sys_idx_fd, sysno * SYS_IDX_ENTRY_LEN, SEEK_SET);
205 write (sys_idx_fd, kname, strlen(kname)+1);
/* Known file: read the stored sysno, skipping the first byte of the
 * entry (presumably a length byte -- TODO confirm against dict_lookup). */
208 memcpy (&sysno, (char*) file_info+1, sizeof(sysno));
/* Open the input file for reading; failure is logged as a warning with
 * errno. */
210 if (!(inf = fopen (fname, "r")))
212 logf (LOG_WARN|LOG_ERRNO, "open %s", fname);
/* Resolve the record type handler for the file type found above. */
215 if (!(rt = recType_byName (file_type)))
/* Hand the input stream and the word callbacks to the extractor. */
217 extractCtrl.inf = inf;
218 extractCtrl.subType = "";
219 extractCtrl.init = wordInit;
220 extractCtrl.add = wordAdd;
/* Run the extractor through the record type's extract function
 * pointer. */
223 (*rt->extract)(&extractCtrl);