2 * Copyright (C) 1994-1998, Index Data
4 * Sebastian Hammer, Adam Dickmeiss
7 * Revision 1.11 1999-05-21 12:00:17 adam
8 * Better diagnostics for extraction process.
10 * Revision 1.10 1999/05/20 12:57:18 adam
11 * Implemented TCL filter. Updated recctrl system.
13 * Revision 1.9 1998/10/16 08:14:38 adam
14 * Updated record control system.
16 * Revision 1.8 1998/05/20 10:12:27 adam
17 * Implemented automatic EXPLAIN database maintenance.
18 * Modified Zebra to work with ASN.1 compiled version of YAZ.
20 * Revision 1.7 1998/03/11 11:19:05 adam
21 * Changed the way sequence numbers are generated.
23 * Revision 1.6 1998/02/10 12:03:06 adam
26 * Revision 1.5 1997/10/27 14:33:06 adam
27 * Moved towards generic character mapping depending on "structure"
28 * field in abstract syntax file. Fixed a few memory leaks. Fixed
29 * bug with negative integers when doing searches with relational
32 * Revision 1.4 1996/11/04 14:09:16 adam
35 * Revision 1.3 1996/11/01 09:00:33 adam
36 * This simple "text" format now supports element specs B and M.
38 * Revision 1.2 1996/10/29 14:02:45 adam
39 * Uses buffered read to speed up things.
41 * Revision 1.1 1996/10/11 10:57:28 adam
42 * New module recctrl. Used to manage records (extract/retrieval).
44 * Revision 1.7 1996/01/17 14:57:55 adam
45 * Prototype changed for reader functions in extract/retrieve. File
46 * is identified by 'void *' instead of 'int'.
48 * Revision 1.6 1995/10/10 13:59:24 adam
49 * Function rset_open changed its wflag parameter to general flags.
51 * Revision 1.5 1995/10/02 16:24:39 adam
52 * Use attribute actually used in search requests.
54 * Revision 1.4 1995/10/02 15:42:55 adam
55 * Extract uses file descriptors instead of FILE pointers.
57 * Revision 1.3 1995/09/28 09:19:45 adam
58 * xfree/xmalloc used everywhere.
59 * Extract/retrieve method seems to work for text records.
61 * Revision 1.2 1995/09/15 14:45:21 adam
65 * Revision 1.1 1995/09/14 07:48:25 adam
66 * Record control management.
76 static void *text_init (RecType recType)
81 static void text_destroy (void *clientData)
86 struct recExtractCtrl *p;
92 struct buf_info *buf_open (struct recExtractCtrl *p)
94 struct buf_info *fi = xmalloc (sizeof(*fi));
97 fi->buf = xmalloc (4096);
103 int buf_read (struct buf_info *fi, char *dst)
105 if (fi->offset >= fi->max)
109 fi->max = (*fi->p->readf)(fi->p->fh, fi->buf, 4096);
114 *dst = fi->buf[(fi->offset)++];
118 void buf_close (struct buf_info *fi)
124 static int text_extract (void *clientData, struct recExtractCtrl *p)
129 struct buf_info *fi = buf_open (p);
131 (*p->init)(p, &recWord);
132 recWord.reg_type = 'w';
137 r = buf_read (fi, w);
138 while (r > 0 && i < 511 && w[i] != '\n' && w[i] != '\r')
141 r = buf_read (fi, w + i);
147 (*p->addWord)(&recWord);
151 return RECCTRL_EXTRACT_OK;
154 static int text_retrieve (void *clientData, struct recRetrieveCtrl *p)
157 static char *text_buf = NULL;
158 static int text_size = 0;
160 const char *elementSetName = NULL;
163 if (p->comp && p->comp->which == Z_RecordComp_simple &&
164 p->comp->u.simple->which == Z_ElementSetNames_generic)
165 elementSetName = p->comp->u.simple->u.generic;
169 if (text_ptr + 4096 >= text_size)
173 text_size = 2*text_size + 8192;
174 nb = xmalloc (text_size);
177 memcpy (nb, text_buf, text_ptr);
187 sprintf (text_buf, "Rank: %d\n", p->score);
188 text_ptr = strlen(text_buf);
190 sprintf (text_buf + text_ptr, "Local Number: %d\n", p->localno);
191 text_ptr = strlen(text_buf);
193 r = (*p->readf)(p->fh, text_buf + text_ptr, 4096);
198 text_buf[text_ptr] = '\0';
201 if (!strcmp (elementSetName, "B"))
203 if (!strcmp (elementSetName, "M"))
211 while (++i <= no_lines && (p = strchr (p, '\n')))
216 text_ptr = p-text_buf;
219 p->output_format = VAL_SUTRS;
220 p->rec_buf = text_buf;
221 p->rec_len = text_ptr;
225 static struct recType text_type = {
233 RecType recTypeText = &text_type; /* non-static handle to the file-local text_type descriptor defined above */