2 * Copyright (C) 1994-1998, Index Data
4 * Sebastian Hammer, Adam Dickmeiss
7 * Revision 1.12 1999-05-26 07:49:14 adam
10 * Revision 1.11 1999/05/21 12:00:17 adam
11 * Better diagnostics for extraction process.
13 * Revision 1.10 1999/05/20 12:57:18 adam
14 * Implemented TCL filter. Updated recctrl system.
16 * Revision 1.9 1998/10/16 08:14:38 adam
17 * Updated record control system.
19 * Revision 1.8 1998/05/20 10:12:27 adam
20 * Implemented automatic EXPLAIN database maintenance.
21 * Modified Zebra to work with ASN.1 compiled version of YAZ.
23 * Revision 1.7 1998/03/11 11:19:05 adam
24 * Changed the way sequence numbers are generated.
26 * Revision 1.6 1998/02/10 12:03:06 adam
29 * Revision 1.5 1997/10/27 14:33:06 adam
30 * Moved towards generic character mapping depending on "structure"
31 * field in abstract syntax file. Fixed a few memory leaks. Fixed
32 * bug with negative integers when doing searches with relational
35 * Revision 1.4 1996/11/04 14:09:16 adam
38 * Revision 1.3 1996/11/01 09:00:33 adam
39 * This simple "text" format now supports element specs B and M.
41 * Revision 1.2 1996/10/29 14:02:45 adam
42 * Uses buffered read to speed up things.
44 * Revision 1.1 1996/10/11 10:57:28 adam
45 * New module recctrl. Used to manage records (extract/retrieval).
47 * Revision 1.7 1996/01/17 14:57:55 adam
48 * Prototype changed for reader functions in extract/retrieve. File
49 * is identified by 'void *' instead of 'int.
51 * Revision 1.6 1995/10/10 13:59:24 adam
52 * Function rset_open changed its wflag parameter to general flags.
54 * Revision 1.5 1995/10/02 16:24:39 adam
55 * Use attribute actually used in search requests.
57 * Revision 1.4 1995/10/02 15:42:55 adam
58 * Extract uses file descriptors instead of FILE pointers.
60 * Revision 1.3 1995/09/28 09:19:45 adam
61 * xfree/xmalloc used everywhere.
62 * Extract/retrieve method seems to work for text records.
64 * Revision 1.2 1995/09/15 14:45:21 adam
68 * Revision 1.1 1995/09/14 07:48:25 adam
69 * Record control management.
79 static void *text_init (RecType recType)
84 static void text_destroy (void *clientData)
89 struct recExtractCtrl *p;
95 struct buf_info *buf_open (struct recExtractCtrl *p)
97 struct buf_info *fi = (struct buf_info *) xmalloc (sizeof(*fi));
100 fi->buf = (char *) xmalloc (4096);
106 int buf_read (struct buf_info *fi, char *dst)
108 if (fi->offset >= fi->max)
112 fi->max = (*fi->p->readf)(fi->p->fh, fi->buf, 4096);
117 *dst = fi->buf[(fi->offset)++];
121 void buf_close (struct buf_info *fi)
127 static int text_extract (void *clientData, struct recExtractCtrl *p)
132 struct buf_info *fi = buf_open (p);
134 (*p->init)(p, &recWord);
135 recWord.reg_type = 'w';
140 r = buf_read (fi, w);
141 while (r > 0 && i < 511 && w[i] != '\n' && w[i] != '\r')
144 r = buf_read (fi, w + i);
150 (*p->addWord)(&recWord);
154 return RECCTRL_EXTRACT_OK;
157 static int text_retrieve (void *clientData, struct recRetrieveCtrl *p)
160 static char *text_buf = NULL;
161 static int text_size = 0;
163 const char *elementSetName = NULL;
166 if (p->comp && p->comp->which == Z_RecordComp_simple &&
167 p->comp->u.simple->which == Z_ElementSetNames_generic)
168 elementSetName = p->comp->u.simple->u.generic;
172 if (text_ptr + 4096 >= text_size)
176 text_size = 2*text_size + 8192;
177 nb = (char *) xmalloc (text_size);
180 memcpy (nb, text_buf, text_ptr);
190 sprintf (text_buf, "Rank: %d\n", p->score);
191 text_ptr = strlen(text_buf);
193 sprintf (text_buf + text_ptr, "Local Number: %d\n", p->localno);
194 text_ptr = strlen(text_buf);
196 r = (*p->readf)(p->fh, text_buf + text_ptr, 4096);
201 text_buf[text_ptr] = '\0';
204 if (!strcmp (elementSetName, "B"))
206 if (!strcmp (elementSetName, "M"))
214 while (++i <= no_lines && (p = strchr (p, '\n')))
219 text_ptr = p-text_buf;
222 p->output_format = VAL_SUTRS;
223 p->rec_buf = text_buf;
224 p->rec_len = text_ptr;
228 static struct recType text_type = {
236 RecType recTypeText = &text_type;