1 /* $Id: extract.c,v 1.177 2005-03-17 09:48:46 adam Exp $
2 Copyright (C) 1995-2005
5 This file is part of the Zebra server.
7 Zebra is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
12 Zebra is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License
18 along with Zebra; see the file LICENSE.zebra. If not, write to the
19 Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA
/* printf conversion used for off_t values in this file: "%Ld" when
   _FILE_OFFSET_BITS is 64, "%ld" otherwise (the #else/#endif lines are not
   part of this listing).
   NOTE(review): ISO C defines the L length modifier only for floating-point
   conversions; "%Ld" with an integer argument is a library extension.
   "%lld" with a (long long) cast would be the portable spelling. */
37 #if _FILE_OFFSET_BITS == 64
38 #define PRINTF_OFF_T "%Ld"
40 #define PRINTF_OFF_T "%ld"
/* Set to 0 here; the place where it is tested is not visible in this
   listing -- presumably it selects between qsort and shellsort, TODO confirm. */
43 #define USE_SHELLSORT 0
/* Shell-sort helper: orders the r elements of size s stored at ar using cmp.
   The gaps come from the fixed, descending table incs[] (16 entries, the
   last one being 1), one pass per gap.
   NOTE(review): several body lines (local declarations, braces, the final
   store of the saved element) are missing from this listing; only the
   visible statements are described.
   NOTE(review): the inner loop tests j > h, so index j-h == 0 is never used
   as a comparison operand; a textbook gapped insertion tests j >= h --
   confirm against the full source. */
46 static void shellsort(void *ar, int r, size_t s,
47 int (*cmp)(const void *a, const void *b))
52 static const int incs[16] = { 1391376, 463792, 198768, 86961, 33936,
53 13776, 4592, 1968, 861, 336,
54 112, 48, 21, 7, 3, 1 };
/* outer loop: one pass per gap; inner loop: every element from index h on */
55 for ( k = 0; k < 16; k++)
56 for (h = incs[k], i = h; i < r; i++)
/* move elements that compare greater than v one gap towards the end */
60 while (j > h && (*cmp)(a + s*(j-h), v) > 0)
62 memcpy (a + s*j, a + s*(j-h), s);
/* Counts one processed record on zh and, on every 1000th record, writes a
   progress line with the processed / inserted / updated counters.
   The format string has four ZINT_FORMAT fields; the fourth argument sits
   on a line not shown here (presumably the deleted counter, TODO confirm). */
70 static void logRecord (ZebraHandle zh)
72 ++zh->records_processed;
/* true only when the counter is a multiple of 1000 */
73 if (!(zh->records_processed % 1000))
75 yaz_log (YLOG_LOG, "Records: "ZINT_FORMAT" i/u/d "
76 ZINT_FORMAT"/"ZINT_FORMAT"/"ZINT_FORMAT,
77 zh->records_processed, zh->records_inserted, zh->records_updated,
/* Prepares the word descriptor w for an extraction run described by p.
   Visible assignments: w takes over p's zebra_maps and its attribute set is
   set to VAL_BIB1.  Other initialisations may sit on lines missing from
   this listing. */
82 static void extract_init (struct recExtractCtrl *p, RecWord *w)
84 w->zebra_maps = p->zebra_maps;
86 w->attrSet = VAL_BIB1;
/* Scans the encoded keys in reckeys for entries whose attribute set/use
   equal attrSetS/attrUseS and collects them into the static table ws[32],
   indexed by the key's sequence number relative to startSeq.
   The result lives in static storage, so it is overwritten by the next call
   and the function is not reentrant.
   NOTE(review): lines of the body (declarations, the store into ws[], the
   return) are missing from this listing.
   NOTE(review): the assert below only admits key.len == 3, whereas
   extract_flushRecordKeys asserts key.len == 4 for the same key buffer --
   confirm which length is intended. */
95 static const char **searchRecordKey (ZebraHandle zh,
96 struct recKeys *reckeys,
97 int attrSetS, int attrUseS)
99 static const char *ws[32];
100 void *decode_handle = iscz1_start();
/* loop over all 32 slots of ws[] (loop body not shown) */
106 for (i = 0; i<32; i++)
/* walk the key buffer until all used bytes are consumed */
109 while (off < reckeys->buf_used)
111 const char *src = reckeys->buf + off;
113 char *dst = (char*) &key;
114 int attrSet, attrUse;
/* decode one key into `key`; src is advanced past the encoded bytes */
116 iscz1_decode(decode_handle, &dst, &src);
117 assert(key.len < 4 && key.len > 2);
/* mem[0] packs the attribute set in the bits above 16 and the use value in
   the low 16 bits; the last mem[] slot is the sequence number */
119 attrSet = (int) key.mem[0] >> 16;
120 attrUse = (int) key.mem[0] & 65535;
121 seqno = (int) key.mem[key.len-1];
123 if (attrUseS == attrUse && attrSetS == attrSet)
/* slot index relative to the first matching sequence number; only offsets
   0..30 are accepted */
129 woff = seqno - startSeq;
130 if (woff >= 0 && woff < 31)
136 off = src - reckeys->buf;
138 iscz1_stop(decode_handle);
/* the decoder must have consumed exactly the used part of the buffer */
139 assert (off == reckeys->buf_used);
/* Read state for one input file, passed as the opaque handle to the
   file_seek / file_tell / file_read / file_begin / file_end callbacks.
   Other members used by those callbacks (fd, file_more, sdrbuf, sdrmax)
   are declared on lines missing from this listing. */
143 struct file_read_info {
144 off_t file_max; /* maximum offset so far */
145 off_t file_offset; /* current offset */
146 off_t file_moffset; /* offset of rec/rec boundary */
/* Allocates a file_read_info with xmalloc for the descriptor fd and starts
   with the record boundary (file_moffset) at offset 0.
   The remaining field initialisations and the return statement are on
   lines missing from this listing. */
153 static struct file_read_info *file_read_start (int fd)
155 struct file_read_info *fi = (struct file_read_info *)
156 xmalloc (sizeof(*fi));
160 fi->file_moffset = 0;
/* Takes the read state fi for a file.  The body is not part of this
   listing; presumably it releases fi -- TODO confirm. */
166 static void file_read_stop (struct file_read_info *fi)
/* Seek callback: records offset as the current position in the read state
   and repositions the descriptor with lseek(SEEK_SET), returning lseek's
   result.
   NOTE(review): two lines between the assignment and the return are missing
   from this listing; they may short-circuit the lseek (e.g. for the
   in-memory buffer case) -- confirm. */
171 static off_t file_seek (void *handle, off_t offset)
173 struct file_read_info *p = (struct file_read_info *) handle;
174 p->file_offset = offset;
177 return lseek (p->fd, offset, SEEK_SET);
/* Tell callback: returns the current offset stored in the read state
   (no system call is made). */
180 static off_t file_tell (void *handle)
182 struct file_read_info *p = (struct file_read_info *) handle;
183 return p->file_offset;
/* Read callback: delivers up to count bytes into buf.
   Two sources are visible: a copy out of the in-memory buffer p->sdrbuf
   (clamped to what remains before p->sdrmax), and a read() on the file
   descriptor.  The condition choosing between them, the update of
   file_offset and the return are on lines missing from this listing. */
186 static int file_read (void *handle, char *buf, size_t count)
188 struct file_read_info *p = (struct file_read_info *) handle;
/* never copy past the end of the in-memory buffer */
194 if (r > p->sdrmax - p->file_offset)
195 r = p->sdrmax - p->file_offset;
197 memcpy (buf, p->sdrbuf + p->file_offset, r);
200 r = read (fd, buf, count);
/* keep file_max as the highest offset reached so far */
204 if (p->file_offset > p->file_max)
205 p->file_max = p->file_offset;
/* Rewinds the read state to the last record boundary: the current offset
   becomes file_moffset, and when no in-memory buffer is in use and the
   boundary is non-zero the descriptor is repositioned with lseek. */
210 static void file_begin (void *handle)
212 struct file_read_info *p = (struct file_read_info *) handle;
214 p->file_offset = p->file_moffset;
/* the lseek result is not checked here */
215 if (!p->sdrbuf && p->file_moffset)
216 lseek (p->fd, p->file_moffset, SEEK_SET);
/* End-of-record callback: stores offset as the new record boundary
   (file_moffset).  It asserts that file_more is still 0 on entry; the line
   between the assert and the assignment is missing from this listing
   (presumably it sets file_more -- TODO confirm). */
220 static void file_end (void *handle, off_t offset)
222 struct file_read_info *p = (struct file_read_info *) handle;
224 assert (p->file_more == 0);
226 p->file_moffset = offset;
/* Builds the match string for a record from the match specification spec.
   Three kinds of spec element are visible:
     - an attribute reference "set,use)" whose terms are fetched from the
       record's keys with searchRecordKey;
     - a special name (group, database, filename, type) replaced by the
       corresponding value from zh or the file name;
     - a quoted literal, delimited by " or ', copied as is.
   The pieces are appended to the static buffer dstBuf[2048], so the result
   is overwritten by the next call and the function is not reentrant.
   Problems are reported with yaz_log(YLOG_WARN, ...); fname is used in the
   "No match criteria" message.
   NOTE(review): many lines (braces, returns, the tests that select each
   element kind) are missing from this listing.
   NOTE(review): the strcpy calls into dst show no bounds check against
   dstBuf, and no check of i is visible in the loops filling attset_str[64],
   attname_str[64] and tmpString -- such checks may be on missing lines;
   confirm. */
229 static char *fileMatchStr (ZebraHandle zh,
230 struct recKeys *reckeys,
231 const char *fname, const char *spec)
233 static char dstBuf[2048]; /* static here ??? */
235 const char *s = spec;
236 static const char **w;
/* skip blanks and tabs between spec elements */
240 while (*s == ' ' || *s == '\t')
246 char attset_str[64], attname_str[64];
247 data1_attset *attset;
/* both default to 1 when the names cannot be resolved */
250 int attSet = 1, attUse = 1;
/* text up to ',' or ')' names the attribute set */
254 for (i = 0; *s && *s != ',' && *s != ')'; s++)
256 attset_str[i++] = *s;
257 attset_str[i] = '\0';
/* text up to ')' names the attribute (or is a number, see atoi below) */
262 for (i = 0; *s && *s != ')'; s++)
264 attname_str[i++] = *s;
265 attname_str[i] = '\0';
268 if ((attset = data1_get_attset (zh->reg->dh, attset_str)))
271 attSet = attset->reference;
272 att = data1_getattbyname(zh->reg->dh, attset, attname_str);
/* numeric use value taken from the text; atoi reports no errors */
276 attUse = atoi (attname_str);
278 w = searchRecordKey (zh, reckeys, attSet, attUse);
283 for (i = 0; i<32; i++)
288 yaz_log (YLOG_WARN, "Missing ) in match criteria %s in group %s",
289 spec, zh->m_group ? zh->m_group : "none");
/* use every slot that is both flagged and present in the record */
294 for (i = 0; i<32; i++)
295 if (matchFlag[i] && w[i])
307 yaz_log (YLOG_WARN, "Record didn't contain match"
308 " fields in (%s,%s)", attset_str, attname_str);
/* special name: runs from the character after the marker to the next
   blank or tab */
316 const char *spec_src = NULL;
317 const char *s1 = ++s;
318 while (*s1 && *s1 != ' ' && *s1 != '\t')
324 memcpy (special, s, spec_len);
325 special[spec_len] = '\0';
328 if (!strcmp (special, "group"))
329 spec_src = zh->m_group;
330 else if (!strcmp (special, "database"))
331 spec_src = zh->basenames[0];
332 else if (!strcmp (special, "filename")) {
335 else if (!strcmp (special, "type"))
336 spec_src = zh->m_record_type;
341 strcpy (dst, spec_src);
342 dst += strlen (spec_src);
/* quoted literal: the opening quote character is also the terminator */
345 else if (*s == '\"' || *s == '\'')
347 int stopMarker = *s++;
351 while (*s && *s != stopMarker)
354 tmpString[i++] = *s++;
359 strcpy (dst, tmpString);
360 dst += strlen (tmpString);
364 yaz_log (YLOG_WARN, "Syntax error in match criteria %s in group %s",
365 spec, zh->m_group ? zh->m_group : "none");
372 yaz_log (YLOG_WARN, "No match criteria for record %s in group %s",
373 fname, zh->m_group ? zh->m_group : "none");
/* Logging context for a record.  Only the rGroup member is visible in this
   listing; the other members are on missing lines. */
380 struct recordLogInfo {
383 struct recordGroup *rGroup;
/* Readies the key encoder of keys for a new record by resetting
   keys->codec_handle with iscz1_reset.  A line before the reset is missing
   from this listing (presumably the handle is created on first use --
   TODO confirm). */
386 void create_rec_keys_codec(struct recKeys *keys)
389 iscz1_reset(keys->codec_handle);
/* Extracts one record from an open file and inserts, updates or deletes it
   in the register.
   Visible flow:
     1. resolve the record type handler with recType_byName and select (or
        create) the explain database for zh->basenames[0];
     2. fill a recExtractCtrl with the file_* callbacks and run the type's
        extract function;
     3. take the match string from the filter (extractCtrl.match_criteria)
        or build it with fileMatchStr from zh->m_record_id, and look it up
        in zh->reg->matchDict to obtain *sysno;
     4. create the record with rec_new, or fetch it with rec_get, flush its
        stored keys with cmd 0 and then delete or update it;
     5. refresh the stored file type, filename, delete keys, sort keys,
        size, run number, optional record data and database name, then
        commit with rec_put.
   NOTE(review): parameters, braces, return statements and several
   conditions are missing from this listing; comments below describe only
   what is shown. */
392 static int file_extract_record(ZebraHandle zh,
393 SYSNO *sysno, const char *fname,
395 struct file_read_info *fi,
398 RecordAttr *recordAttr;
400 const char *matchStr = 0;
403 off_t recordOffset = 0;
408 recType_byName (zh->reg->recTypes, zh->res, zh->m_record_type,
411 yaz_log (YLOG_WARN, "No such record type: %s", zh->m_record_type);
415 /* announce database */
416 if (zebraExplain_curDatabase (zh->reg->zei, zh->basenames[0]))
418 if (zebraExplain_newDatabase (zh->reg->zei, zh->basenames[0],
419 zh->m_explain_database))
425 struct recExtractCtrl extractCtrl;
427 /* we are going to read from a file, so prepare the extraction */
430 create_rec_keys_codec(&zh->reg->keys);
432 zh->reg->sortKeys.buf_used = 0;
/* the record starts at the last record boundary of the file */
434 recordOffset = fi->file_moffset;
435 extractCtrl.offset = fi->file_moffset;
436 extractCtrl.readf = file_read;
437 extractCtrl.seekf = file_seek;
438 extractCtrl.tellf = file_tell;
439 extractCtrl.endf = file_end;
441 extractCtrl.init = extract_init;
442 extractCtrl.tokenAdd = extract_token_add;
443 extractCtrl.schemaAdd = extract_schema_add;
444 extractCtrl.dh = zh->reg->dh;
445 extractCtrl.match_criteria[0] = '\0';
446 extractCtrl.handle = zh;
/* sequence numbers start at 1 for positioned register types, 0 otherwise */
447 for (i = 0; i<256; i++)
449 if (zebra_maps_is_positioned(zh->reg->zebra_maps, i))
450 extractCtrl.seqno[i] = 1;
452 extractCtrl.seqno[i] = 0;
454 extractCtrl.zebra_maps = zh->reg->zebra_maps;
455 extractCtrl.flagShowRecords = !zh->m_flag_rw;
458 printf ("File: %s " PRINTF_OFF_T "\n", fname, recordOffset);
/* log prefix "<file>:<offset>" while the filter runs.
   NOTE(review): unbounded sprintf; the size of msg is not visible here. */
462 sprintf (msg, "%s:" PRINTF_OFF_T , fname, recordOffset);
463 yaz_log_init_prefix2 (msg);
466 r = (*recType->extract)(clientData, &extractCtrl);
468 yaz_log_init_prefix2 (0);
469 if (r == RECCTRL_EXTRACT_EOF)
471 else if (r == RECCTRL_EXTRACT_ERROR_GENERIC)
473 /* error occurred during extraction ... */
475 zh->records_processed < zh->m_file_verbose_limit)
477 yaz_log (YLOG_WARN, "fail %s %s " PRINTF_OFF_T, zh->m_record_type,
478 fname, recordOffset);
482 else if (r == RECCTRL_EXTRACT_ERROR_NO_SUCH_FILTER)
484 /* error occurred during extraction ... */
486 zh->records_processed < zh->m_file_verbose_limit)
488 yaz_log (YLOG_WARN, "no filter for %s %s "
489 PRINTF_OFF_T, zh->m_record_type,
490 fname, recordOffset);
/* a match string supplied by the filter takes precedence */
494 if (extractCtrl.match_criteria[0])
495 matchStr = extractCtrl.match_criteria;
498 /* perform match if sysno not known and if match criteria is specified */
504 if (matchStr == 0 && zh->m_record_id && *zh->m_record_id)
507 matchStr = fileMatchStr (zh, &zh->reg->keys, fname,
511 yaz_log(YLOG_WARN, "Bad match criteria");
/* dictionary entries hold a length byte followed by the sysno bytes */
517 char *rinfo = dict_lookup (zh->reg->matchDict, matchStr);
520 assert(*rinfo == sizeof(*sysno));
521 memcpy (sysno, rinfo+1, sizeof(*sysno));
525 if (! *sysno && zh->reg->keys.buf_used == 0)
527 /* the extraction process returned no information - the record
528 is probably empty - unless flagShowRecords is in use */
532 if (zh->records_processed < zh->m_file_verbose_limit)
533 yaz_log (YLOG_WARN, "empty %s %s " PRINTF_OFF_T, zh->m_record_type,
534 fname, recordOffset);
543 yaz_log (YLOG_LOG, "delete %s %s " PRINTF_OFF_T, zh->m_record_type,
544 fname, recordOffset);
545 yaz_log (YLOG_WARN, "cannot delete record above (seems new)");
548 if (zh->records_processed < zh->m_file_verbose_limit)
549 yaz_log (YLOG_LOG, "add %s %s " PRINTF_OFF_T, zh->m_record_type,
550 fname, recordOffset);
/* new record: allocate it, remember its match string, flush its keys */
551 rec = rec_new (zh->reg->records);
555 recordAttr = rec_init_attr (zh->reg->zei, rec);
559 dict_insert (zh->reg->matchDict, matchStr, sizeof(*sysno), sysno);
561 extract_flushSortKeys (zh, *sysno, 1, &zh->reg->sortKeys);
562 extract_flushRecordKeys (zh, *sysno, 1, &zh->reg->keys);
564 zh->records_inserted++;
568 /* record already exists */
569 struct recKeys delkeys;
570 struct sortKeys sortKeys;
572 rec = rec_get (zh->reg->records, *sysno);
575 recordAttr = rec_init_attr (zh->reg->zei, rec);
/* without force_update, a record whose run number equals the current one
   is skipped */
577 if (!force_update && recordAttr->runNumber ==
578 zebraExplain_runNumberIncrement (zh->reg->zei, 0))
580 yaz_log (YLOG_LOG, "run number = " ZINT_FORMAT,
581 recordAttr->runNumber);
582 yaz_log (YLOG_LOG, "skipped %s %s " PRINTF_OFF_T,
583 zh->m_record_type, fname, recordOffset);
584 extract_flushSortKeys (zh, *sysno, -1, &zh->reg->sortKeys);
/* keys stored with the old version of the record are flushed with cmd 0 */
589 delkeys.buf_used = rec->size[recInfo_delKeys];
590 delkeys.buf = rec->info[recInfo_delKeys];
592 sortKeys.buf_used = rec->size[recInfo_sortKeys];
593 sortKeys.buf = rec->info[recInfo_sortKeys];
595 extract_flushSortKeys (zh, *sysno, 0, &sortKeys);
596 extract_flushRecordKeys (zh, *sysno, 0, &delkeys);
599 /* record going to be deleted */
600 if (!delkeys.buf_used)
602 yaz_log (YLOG_LOG, "delete %s %s " PRINTF_OFF_T,
603 zh->m_record_type, fname, recordOffset);
604 yaz_log (YLOG_WARN, "cannot delete file above, storeKeys false");
608 if (zh->records_processed < zh->m_file_verbose_limit)
609 yaz_log (YLOG_LOG, "delete %s %s " PRINTF_OFF_T,
610 zh->m_record_type, fname, recordOffset);
611 zh->records_deleted++;
613 dict_delete (zh->reg->matchDict, matchStr);
614 rec_del (zh->reg->records, &rec);
622 /* record going to be updated */
623 if (!delkeys.buf_used)
625 yaz_log (YLOG_LOG, "update %s %s " PRINTF_OFF_T,
626 zh->m_record_type, fname, recordOffset);
627 yaz_log (YLOG_WARN, "cannot update file above, storeKeys false");
631 if (zh->records_processed < zh->m_file_verbose_limit)
632 yaz_log (YLOG_LOG, "update %s %s " PRINTF_OFF_T,
633 zh->m_record_type, fname, recordOffset);
634 extract_flushSortKeys (zh, *sysno, 1, &zh->reg->sortKeys);
635 extract_flushRecordKeys (zh, *sysno, 1, &zh->reg->keys);
636 zh->records_updated++;
640 /* update file type */
641 xfree (rec->info[recInfo_fileType]);
642 rec->info[recInfo_fileType] =
643 rec_strdup (zh->m_record_type, &rec->size[recInfo_fileType]);
645 /* update filename */
646 xfree (rec->info[recInfo_filename]);
647 rec->info[recInfo_filename] =
648 rec_strdup (fname, &rec->size[recInfo_filename]);
650 /* update delete keys */
651 xfree (rec->info[recInfo_delKeys]);
/* the key buffer is handed over to the record (ownership moves), so the
   register's pointer is cleared to avoid a double free */
652 if (zh->reg->keys.buf_used > 0 && zh->m_store_keys == 1)
654 rec->size[recInfo_delKeys] = zh->reg->keys.buf_used;
655 rec->info[recInfo_delKeys] = zh->reg->keys.buf;
656 zh->reg->keys.buf = NULL;
657 zh->reg->keys.buf_max = 0;
661 rec->info[recInfo_delKeys] = NULL;
662 rec->size[recInfo_delKeys] = 0;
665 /* update sort keys */
666 xfree (rec->info[recInfo_sortKeys]);
668 rec->size[recInfo_sortKeys] = zh->reg->sortKeys.buf_used;
669 rec->info[recInfo_sortKeys] = zh->reg->sortKeys.buf;
670 zh->reg->sortKeys.buf = NULL;
671 zh->reg->sortKeys.buf_max = 0;
673 /* save file size of original record */
674 zebraExplain_recordBytesIncrement (zh->reg->zei,
675 - recordAttr->recordSize);
/* size = distance to the new record boundary; when that is 0 the highest
   offset read so far is used instead */
676 recordAttr->recordSize = fi->file_moffset - recordOffset;
677 if (!recordAttr->recordSize)
678 recordAttr->recordSize = fi->file_max - recordOffset;
679 zebraExplain_recordBytesIncrement (zh->reg->zei,
680 recordAttr->recordSize);
682 /* set run-number for this record */
683 recordAttr->runNumber = zebraExplain_runNumberIncrement (zh->reg->zei,
686 /* update store data */
687 xfree (rec->info[recInfo_storeData]);
688 if (zh->m_store_data)
690 rec->size[recInfo_storeData] = recordAttr->recordSize;
691 rec->info[recInfo_storeData] = (char *)
692 xmalloc (recordAttr->recordSize);
/* re-read the raw record bytes from the file into the stored copy */
693 if (lseek (fi->fd, recordOffset, SEEK_SET) < 0)
695 yaz_log (YLOG_ERRNO|YLOG_FATAL, "seek to " PRINTF_OFF_T " in %s",
696 recordOffset, fname);
/* NOTE(review): a short read is treated like an error, and "%d" is used
   for recordSize whose type is not visible here -- confirm they match. */
699 if (read (fi->fd, rec->info[recInfo_storeData], recordAttr->recordSize)
700 < recordAttr->recordSize)
702 yaz_log (YLOG_ERRNO|YLOG_FATAL, "read %d bytes of %s",
703 recordAttr->recordSize, fname);
709 rec->info[recInfo_storeData] = NULL;
710 rec->size[recInfo_storeData] = 0;
712 /* update database name */
713 xfree (rec->info[recInfo_databaseName]);
714 rec->info[recInfo_databaseName] =
715 rec_strdup (zh->basenames[0], &rec->size[recInfo_databaseName]);
718 recordAttr->recordOffset = recordOffset;
720 /* commit this record */
721 rec_put (zh->reg->records, &rec);
/* Indexes the file fname: determines the record type and the match
   criteria from the file extension when zh does not already provide them,
   opens the file and calls file_extract_record repeatedly.
   Resource names are built as "<group>.recordType.<ext>" and
   "<group>.recordId.<ext>" (the group prefix handling for an empty group is
   on a line not shown).  zh->m_record_type is restored to its original
   value on the visible exit paths.
   NOTE(review): parameters after fname, local declarations, braces and
   returns are missing from this listing.
   NOTE(review): gprefix, ext, ext_res and full_rep are filled with
   sprintf/strcpy/strcat; their sizes are not visible here, so overflow
   safety for long group names or paths cannot be confirmed. */
726 int fileExtract (ZebraHandle zh, SYSNO *sysno, const char *fname,
733 struct file_read_info *fi;
734 const char *original_record_type = 0;
736 if (!zh->m_group || !*zh->m_group)
739 sprintf (gprefix, "%s.", zh->m_group);
741 yaz_log (YLOG_DEBUG, "fileExtract %s", fname);
743 /* determine file extension */
/* scan backwards from the end of the name for the last '.' */
745 for (i = strlen(fname); --i >= 0; )
748 else if (fname[i] == '.')
750 strcpy (ext, fname+i+1);
753 /* determine file type - depending on extension */
754 original_record_type = zh->m_record_type;
755 if (!zh->m_record_type)
757 sprintf (ext_res, "%srecordType.%s", gprefix, ext);
758 zh->m_record_type = res_get (zh->res, ext_res);
/* still unknown: the file is reported with "?" */
760 if (!zh->m_record_type)
762 if (zh->records_processed < zh->m_file_verbose_limit)
763 yaz_log (YLOG_LOG, "? %s", fname);
766 /* determine match criteria */
767 if (!zh->m_record_id)
769 sprintf (ext_res, "%srecordId.%s", gprefix, ext);
770 zh->m_record_id = res_get (zh->res, ext_res);
773 if (sysno && deleteFlag)
/* relative names are resolved against zh->path_reg */
779 if (zh->path_reg && !yaz_is_abspath (fname))
781 strcpy (full_rep, zh->path_reg);
782 strcat (full_rep, "/");
783 strcat (full_rep, fname);
786 strcpy (full_rep, fname);
789 if ((fd = open (full_rep, O_BINARY|O_RDONLY)) == -1)
791 yaz_log (YLOG_WARN|YLOG_ERRNO, "open %s", full_rep);
792 zh->m_record_type = original_record_type;
796 fi = file_read_start (fd);
/* keep extracting while the last call succeeded, no explicit sysno was
   given and the reader reports more data */
800 r = file_extract_record (zh, sysno, fname, deleteFlag, fi, 1);
801 } while (r && !sysno && fi->file_more);
805 zh->m_record_type = original_record_type;
810 If sysno is provided, then it's used to identify the record.
811 If not, and match_criteria is provided, then sysno is guessed
812 If not, and a record is provided, then sysno is got from there
/* Extracts one record held in memory (buf, buf_size) and inserts, updates
   or deletes it in the register.
   Visible flow:
     1. set up a zebra_fetch_control over buf and a recExtractCtrl using the
        zebra_record_int_* callbacks;
     2. select (or create) the explain database for zh->basenames[0];
     3. resolve the record type from recordType when given, otherwise from
        zh->m_record_type, and run the type's extract function;
     4. choose the match string: the filter's match_criteria, else the
        match_criteria argument, else fileMatchStr on zh->m_record_id; look
        it up in zh->reg->matchDict to obtain *sysno;
     5. create the record with rec_new, or fetch it with rec_get, flush its
        stored keys with cmd 0 and then delete or update it;
     6. refresh the stored file type, filename, delete keys, sort keys,
        size, run number, optional record data (copied from buf) and
        database name, then commit with rec_put.
   NOTE(review): parameters, braces, returns, several conditions and
   preprocessor lines are missing from this listing; comments below
   describe only what is shown. */
815 int buffer_extract_record (ZebraHandle zh,
816 const char *buf, size_t buf_size,
819 const char *recordType,
821 const char *match_criteria,
826 RecordAttr *recordAttr;
827 struct recExtractCtrl extractCtrl;
829 const char *matchStr = 0;
830 RecType recType = NULL;
833 long recordOffset = 0;
834 struct zebra_fetch_control fc;
835 const char *pr_fname = fname; /* filename to print .. */
836 int show_progress = zh->records_processed < zh->m_file_verbose_limit ? 1:0;
839 pr_fname = "<no file>"; /* make it printable if file is omitted */
/* the fetch control reads straight from the caller's buffer */
842 fc.record_int_buf = buf;
843 fc.record_int_len = buf_size;
844 fc.record_int_pos = 0;
846 fc.record_offset = 0;
848 extractCtrl.offset = 0;
849 extractCtrl.readf = zebra_record_int_read;
850 extractCtrl.seekf = zebra_record_int_seek;
851 extractCtrl.tellf = zebra_record_int_tell;
852 extractCtrl.endf = zebra_record_int_end;
853 extractCtrl.fh = &fc;
855 create_rec_keys_codec(&zh->reg->keys);
857 zh->reg->sortKeys.buf_used = 0;
859 if (zebraExplain_curDatabase (zh->reg->zei, zh->basenames[0]))
861 if (zebraExplain_newDatabase (zh->reg->zei, zh->basenames[0],
862 zh->m_explain_database))
/* an explicit, non-empty recordType wins over the handle's default */
866 if (recordType && *recordType) {
867 yaz_log (YLOG_DEBUG, "Record type explicitly specified: %s", recordType);
868 recType = recType_byName (zh->reg->recTypes, zh->res, recordType,
871 if (!(zh->m_record_type)) {
872 yaz_log (YLOG_WARN, "No such record type defined");
875 yaz_log (YLOG_DEBUG, "Get record type from rgroup: %s",zh->m_record_type);
876 recType = recType_byName (zh->reg->recTypes, zh->res,
877 zh->m_record_type, &clientData);
878 recordType = zh->m_record_type;
/* NOTE(review): this message prints zh->m_record_type even when the type
   came from the recordType argument -- confirm which name should be
   logged. */
882 yaz_log (YLOG_WARN, "No such record type: %s", zh->m_record_type);
886 extractCtrl.init = extract_init;
887 extractCtrl.tokenAdd = extract_token_add;
888 extractCtrl.schemaAdd = extract_schema_add;
889 extractCtrl.dh = zh->reg->dh;
890 extractCtrl.handle = zh;
891 extractCtrl.zebra_maps = zh->reg->zebra_maps;
892 extractCtrl.flagShowRecords = 0;
893 extractCtrl.match_criteria[0] = '\0';
/* sequence numbers start at 1 for positioned register types, 0 otherwise */
894 for (i = 0; i<256; i++)
896 if (zebra_maps_is_positioned(zh->reg->zebra_maps, i))
897 extractCtrl.seqno[i] = 1;
899 extractCtrl.seqno[i] = 0;
902 r = (*recType->extract)(clientData, &extractCtrl);
904 if (r == RECCTRL_EXTRACT_EOF)
906 else if (r == RECCTRL_EXTRACT_ERROR_GENERIC)
908 /* error occurred during extraction ... */
909 yaz_log (YLOG_WARN, "extract error: generic");
912 else if (r == RECCTRL_EXTRACT_ERROR_NO_SUCH_FILTER)
914 /* error occurred during extraction ... */
915 yaz_log (YLOG_WARN, "extract error: no such filter");
/* a match string produced by the filter replaces the caller's one */
921 if (extractCtrl.match_criteria[0])
922 match_criteria = extractCtrl.match_criteria;
926 if (match_criteria && *match_criteria) {
927 matchStr = match_criteria;
929 if (zh->m_record_id && *zh->m_record_id) {
930 matchStr = fileMatchStr (zh, &zh->reg->keys, pr_fname,
934 yaz_log (YLOG_WARN, "Bad match criteria (recordID)");
/* dictionary entries hold a length byte followed by the sysno bytes */
940 rinfo = dict_lookup (zh->reg->matchDict, matchStr);
943 assert(*rinfo == sizeof(*sysno));
944 memcpy (sysno, rinfo+1, sizeof(*sysno));
948 if (zh->reg->keys.buf_used == 0)
950 /* the extraction process returned no information - the record
951 is probably empty - unless flagShowRecords is in use */
962 yaz_log (YLOG_LOG, "delete %s %s %ld", recordType,
963 pr_fname, (long) recordOffset);
964 yaz_log (YLOG_WARN, "cannot delete record above (seems new)");
968 yaz_log (YLOG_LOG, "add %s %s %ld", recordType, pr_fname,
969 (long) recordOffset);
/* new record: allocate it, remember its match string, flush its keys */
970 rec = rec_new (zh->reg->records);
974 recordAttr = rec_init_attr (zh->reg->zei, rec);
978 dict_insert (zh->reg->matchDict, matchStr,
979 sizeof(*sysno), sysno);
981 extract_flushSortKeys (zh, *sysno, 1, &zh->reg->sortKeys);
982 extract_flushRecordKeys (zh, *sysno, 1, &zh->reg->keys);
984 zh->records_inserted++;
988 /* record already exists */
989 struct recKeys delkeys;
990 struct sortKeys sortKeys;
995 yaz_log (YLOG_LOG, "skipped %s %s %ld",
996 recordType, pr_fname, (long) recordOffset);
1001 rec = rec_get (zh->reg->records, *sysno);
1004 recordAttr = rec_init_attr (zh->reg->zei, rec);
/* without force_update, a record whose run number equals the current one
   is skipped */
1006 if (!force_update) {
1007 if (recordAttr->runNumber ==
1008 zebraExplain_runNumberIncrement (zh->reg->zei, 0))
1011 yaz_log (YLOG_LOG, "skipped %s %s %ld", recordType,
1012 pr_fname, (long) recordOffset);
1013 extract_flushSortKeys (zh, *sysno, -1, &zh->reg->sortKeys);
/* keys stored with the old version of the record are flushed with cmd 0 */
1020 delkeys.buf_used = rec->size[recInfo_delKeys];
1021 delkeys.buf = rec->info[recInfo_delKeys];
1023 sortKeys.buf_used = rec->size[recInfo_sortKeys];
1024 sortKeys.buf = rec->info[recInfo_sortKeys];
1026 extract_flushSortKeys (zh, *sysno, 0, &sortKeys);
1027 extract_flushRecordKeys (zh, *sysno, 0, &delkeys);
1030 /* record going to be deleted */
1031 if (!delkeys.buf_used)
1035 yaz_log (YLOG_LOG, "delete %s %s %ld", recordType,
1036 pr_fname, (long) recordOffset);
1037 yaz_log (YLOG_WARN, "cannot delete file above, "
1044 yaz_log (YLOG_LOG, "delete %s %s %ld", recordType,
1045 pr_fname, (long) recordOffset);
1046 zh->records_deleted++;
1048 dict_delete (zh->reg->matchDict, matchStr);
1049 rec_del (zh->reg->records, &rec);
1057 /* record going to be updated */
1058 if (!delkeys.buf_used)
1062 yaz_log (YLOG_LOG, "update %s %s %ld", recordType,
1063 pr_fname, (long) recordOffset);
1064 yaz_log (YLOG_WARN, "cannot update file above, storeKeys false");
1070 yaz_log (YLOG_LOG, "update %s %s %ld", recordType,
1071 pr_fname, (long) recordOffset);
1072 extract_flushSortKeys (zh, *sysno, 1, &zh->reg->sortKeys);
1073 extract_flushRecordKeys (zh, *sysno, 1, &zh->reg->keys);
1074 zh->records_updated++;
1078 /* update file type */
1079 xfree (rec->info[recInfo_fileType]);
1080 rec->info[recInfo_fileType] =
1081 rec_strdup (recordType, &rec->size[recInfo_fileType]);
1083 /* update filename */
1084 xfree (rec->info[recInfo_filename]);
1085 rec->info[recInfo_filename] =
1086 rec_strdup (fname, &rec->size[recInfo_filename]);
1088 /* update delete keys */
1089 xfree (rec->info[recInfo_delKeys]);
/* the key buffer is handed over to the record (ownership moves), so the
   register's pointer is cleared to avoid a double free */
1090 if (zh->reg->keys.buf_used > 0 && zh->m_store_keys == 1)
1092 rec->size[recInfo_delKeys] = zh->reg->keys.buf_used;
1093 rec->info[recInfo_delKeys] = zh->reg->keys.buf;
1094 zh->reg->keys.buf = NULL;
1095 zh->reg->keys.buf_max = 0;
1099 rec->info[recInfo_delKeys] = NULL;
1100 rec->size[recInfo_delKeys] = 0;
1103 /* update sort keys */
1104 xfree (rec->info[recInfo_sortKeys]);
1106 rec->size[recInfo_sortKeys] = zh->reg->sortKeys.buf_used;
1107 rec->info[recInfo_sortKeys] = zh->reg->sortKeys.buf;
1108 zh->reg->sortKeys.buf = NULL;
1109 zh->reg->sortKeys.buf_max = 0;
1111 /* save file size of original record */
1112 zebraExplain_recordBytesIncrement (zh->reg->zei,
1113 - recordAttr->recordSize);
/* NOTE(review): `fi` is not declared in the visible part of this function;
   the next three lines are presumably disabled by preprocessor directives
   that are missing from this listing, leaving buf_size as the record
   size -- confirm. */
1115 recordAttr->recordSize = fi->file_moffset - recordOffset;
1116 if (!recordAttr->recordSize)
1117 recordAttr->recordSize = fi->file_max - recordOffset;
1119 recordAttr->recordSize = buf_size;
1121 zebraExplain_recordBytesIncrement (zh->reg->zei,
1122 recordAttr->recordSize);
1124 /* set run-number for this record */
1125 recordAttr->runNumber =
1126 zebraExplain_runNumberIncrement (zh->reg->zei, 0);
1128 /* update store data */
1129 xfree (rec->info[recInfo_storeData]);
1130 if (zh->m_store_data)
/* keep a private copy of the caller's buffer inside the record */
1132 rec->size[recInfo_storeData] = recordAttr->recordSize;
1133 rec->info[recInfo_storeData] = (char *)
1134 xmalloc (recordAttr->recordSize);
1135 memcpy (rec->info[recInfo_storeData], buf, recordAttr->recordSize);
1139 rec->info[recInfo_storeData] = NULL;
1140 rec->size[recInfo_storeData] = 0;
1142 /* update database name */
1143 xfree (rec->info[recInfo_databaseName]);
1144 rec->info[recInfo_databaseName] =
1145 rec_strdup (zh->basenames[0], &rec->size[recInfo_databaseName]);
1148 recordAttr->recordOffset = recordOffset;
1150 /* commit this record */
1151 rec_put (zh->reg->records, &rec);
/* Re-indexes an explain record: extracts keys from the data1 tree n with
   grs_extract_tree, withdraws the keys previously stored in rec (flush with
   cmd 0), adds the new ones (cmd 1) and stores the fresh key buffers in
   rec.
   handle is the ZebraHandle passed as an opaque pointer.
   NOTE(review): declarations, braces and return statements are missing
   from this listing. */
1156 int explain_extract (void *handle, Record rec, data1_node *n)
1158 ZebraHandle zh = (ZebraHandle) handle;
1159 struct recExtractCtrl extractCtrl;
/* select the record's own database, creating it if it is not known yet */
1162 if (zebraExplain_curDatabase (zh->reg->zei,
1163 rec->info[recInfo_databaseName]))
1166 if (zebraExplain_newDatabase (zh->reg->zei,
1167 rec->info[recInfo_databaseName], 0))
1171 create_rec_keys_codec(&zh->reg->keys);
1173 zh->reg->sortKeys.buf_used = 0;
1175 extractCtrl.init = extract_init;
1176 extractCtrl.tokenAdd = extract_token_add;
1177 extractCtrl.schemaAdd = extract_schema_add;
1178 extractCtrl.dh = zh->reg->dh;
/* all sequence numbers start at 0 here */
1179 for (i = 0; i<256; i++)
1180 extractCtrl.seqno[i] = 0;
1181 extractCtrl.zebra_maps = zh->reg->zebra_maps;
1182 extractCtrl.flagShowRecords = 0;
1183 extractCtrl.match_criteria[0] = '\0';
1184 extractCtrl.handle = handle;
1187 grs_extract_tree(&extractCtrl, n);
/* only records that already carry stored keys have something to withdraw */
1189 if (rec->size[recInfo_delKeys])
1191 struct recKeys delkeys;
1192 struct sortKeys sortkeys;
1194 delkeys.buf_used = rec->size[recInfo_delKeys];
1195 delkeys.buf = rec->info[recInfo_delKeys];
1197 sortkeys.buf_used = rec->size[recInfo_sortKeys];
1198 sortkeys.buf = rec->info[recInfo_sortKeys];
1200 extract_flushSortKeys (zh, rec->sysno, 0, &sortkeys);
1201 extract_flushRecordKeys (zh, rec->sysno, 0, &delkeys);
1203 extract_flushRecordKeys (zh, rec->sysno, 1, &zh->reg->keys);
1204 extract_flushSortKeys (zh, rec->sysno, 1, &zh->reg->sortKeys);
/* hand the new key buffers over to the record and clear the register's
   pointers so the memory has a single owner */
1206 xfree (rec->info[recInfo_delKeys]);
1207 rec->size[recInfo_delKeys] = zh->reg->keys.buf_used;
1208 rec->info[recInfo_delKeys] = zh->reg->keys.buf;
1209 zh->reg->keys.buf = NULL;
1210 zh->reg->keys.buf_max = 0;
1212 xfree (rec->info[recInfo_sortKeys]);
1213 rec->size[recInfo_sortKeys] = zh->reg->sortKeys.buf_used;
1214 rec->info[recInfo_sortKeys] = zh->reg->sortKeys.buf;
1215 zh->reg->sortKeys.buf = NULL;
1216 zh->reg->sortKeys.buf_max = 0;
/* Moves the encoded keys of one record (reckeys) into the register's
   in-memory sort buffer zh->reg->key_buf, tagging each entry with cmd.
   On first use the buffer is allocated; its size is the "memmax" resource
   (default "8") multiplied by 1024*1024.
   The buffer is used from both ends: entry data is appended at
   key_buf_used from the start, while pointers to the entries are stored at
   index ptr_top - ptr_i.  When fewer than 1024 bytes separate the two,
   extract_flushWriteKeys(zh, 0) is called first.
   The explain record count is incremented by 1 when cmd is non-zero and
   decremented by 1 otherwise.
   NOTE(review): declarations, braces and a few statements (e.g. the update
   of ptr_i, the tail of the memcpy call) are missing from this listing.
   NOTE(review): the memmax value is parsed with atoi, which reports no
   errors; the visible warning suggests a range check on a missing line. */
1221 void extract_flushRecordKeys (ZebraHandle zh, SYSNO sysno,
1222 int cmd, struct recKeys *reckeys)
1224 void *decode_handle = iscz1_start();
1227 ZebraExplainInfo zei = zh->reg->zei;
1229 if (!zh->reg->key_buf)
1231 int mem= 1024*1024* atoi( res_get_def( zh->res, "memmax", "8"));
1234 yaz_log(YLOG_WARN, "Invalid memory setting, using default 8 MB");
1237 /* FIXME: That "8" should be in a default settings include */
1238 /* not hard-coded here! -H */
1239 zh->reg->key_buf = (char**) xmalloc (mem);
1240 zh->reg->ptr_top = mem/sizeof(char*);
1242 zh->reg->key_buf_used = 0;
1243 zh->reg->key_file_no = 0;
1245 zebraExplain_recordCountIncrement (zei, cmd ? 1 : -1);
1247 while (off < reckeys->buf_used)
1249 const char *src = reckeys->buf + off;
1251 char *dst = (char*) &key;
/* decode one key; src then points at the term text that follows it */
1253 iscz1_decode(decode_handle, &dst, &src);
1254 assert(key.len == 4);
/* make room when the data area gets within 1024 bytes of the pointer area */
1256 if (zh->reg->key_buf_used + 1024 >
1257 (zh->reg->ptr_top -zh->reg->ptr_i)*sizeof(char*))
1258 extract_flushWriteKeys (zh,0);
1260 assert(zh->reg->ptr_i > 0);
/* record where this entry starts inside the data area */
1261 (zh->reg->key_buf)[zh->reg->ptr_top - zh->reg->ptr_i] =
1262 (char*)zh->reg->key_buf + zh->reg->key_buf_used;
1264 ch = (int) key.mem[0]; /* ordinal for field/use/attribute */
/* entry layout: encoded ordinal, term bytes, NUL, cmd byte, then the key */
1266 zh->reg->key_buf_used +=
1267 key_SU_encode (ch,((char*)zh->reg->key_buf) +
1268 zh->reg->key_buf_used);
1270 ((char*)zh->reg->key_buf) [(zh->reg->key_buf_used)++] = *src++;
1272 ((char*)(zh->reg->key_buf))[(zh->reg->key_buf_used)++] = '\0';
1273 ((char*)(zh->reg->key_buf))[(zh->reg->key_buf_used)++] = cmd;
/* mem[0] becomes the record id: the filter's one when set (the alternative
   assignment is on a missing line); the remaining slots shift down */
1276 if (key.mem[1]) /* filter specified record ID */
1277 key.mem[0] = key.mem[1];
1280 key.mem[1] = key.mem[2]; /* section_id */
1281 key.mem[2] = key.mem[3]; /* sequence .. */
1283 memcpy ((char*)zh->reg->key_buf + zh->reg->key_buf_used,
1285 (zh->reg->key_buf_used) += sizeof(key);
1286 off = src - reckeys->buf;
/* the decoder must have consumed exactly the used part of the buffer */
1288 assert (off == reckeys->buf_used);
1289 iscz1_stop(decode_handle);
/* Sorts the keys collected in zh->reg->key_buf and either merges them
   straight from memory or writes them to a numbered temporary section
   file.
   final is non-zero when this is the last flush of the run.
   The "tempfiles" resource (first letter, upper-cased, default "auto")
   selects the policy: with 'N', or with 'A' when this is both the first
   and the final flush, zebra_index_merge is called directly and no file is
   written; otherwise the section is written with fopen(..., "wb").
   When there is nothing to flush only debug messages are logged.
   NOTE(review): declarations, braces, returns and loop headers are missing
   from this listing.
   NOTE(review): the lines numbered 1380-1413 use unqualified key_buf,
   ptr_top and key_file_no and call extract_get_fname_tmp with two
   arguments; they look like an alternative implementation guarded by
   preprocessor directives that are not visible -- confirm. */
1292 void extract_flushWriteKeys (ZebraHandle zh, int final)
1293 /* optimizing: if final=1, and no files written yet */
1294 /* push the keys directly to merge, sidestepping the */
1295 /* temp file altogether. Speeds small updates */
1298 char out_fname[200];
1300 struct encode_info encode_info;
1301 int ptr_i = zh->reg->ptr_i;
1306 if (!zh->reg->key_buf || ptr_i <= 0)
1308 yaz_log (YLOG_DEBUG, " nothing to flush section=%d buf=%p i=%d",
1309 zh->reg->key_file_no, zh->reg->key_buf, ptr_i);
1310 yaz_log (YLOG_DEBUG, " buf=%p ",
1312 yaz_log (YLOG_DEBUG, " ptr=%d ",zh->reg->ptr_i);
1313 yaz_log (YLOG_DEBUG, " reg=%p ",zh->reg);
1318 (zh->reg->key_file_no)++;
1319 yaz_log (YLOG_LOG, "sorting section %d", (zh->reg->key_file_no));
1320 yaz_log (YLOG_DEBUG, " sort_buff at %p n=%d",
1321 zh->reg->key_buf + zh->reg->ptr_top - ptr_i,ptr_i);
/* sort the ptr_i entry pointers stored at the top end of the buffer */
1323 qsort (zh->reg->key_buf + zh->reg->ptr_top - ptr_i, ptr_i,
1324 sizeof(char*), key_qsort_compare);
1326 /* zebra.cfg: tempfiles:
1327 Y: always use temp files (old way)
1328 A: use temp files, if more than one (auto)
1329 = if this is both the last and the first
1330 N: never bother with temp files (new) */
1332 temp_policy=toupper(res_get_def(zh->res,"tempfiles","auto")[0]);
1333 if (temp_policy != 'Y' && temp_policy != 'N' && temp_policy != 'A') {
1334 yaz_log (YLOG_WARN, "Illegal tempfiles setting '%c'. using 'Auto' ",
1339 if ( ( temp_policy =='N' ) || /* always from memory */
1340 ( ( temp_policy =='A' ) && /* automatic */
1341 (zh->reg->key_file_no == 1) && /* this is first time */
1342 (final) ) ) /* and last (=only) time */
1343 { /* go directly from memory */
1344 zh->reg->key_file_no =0; /* signal not to read files */
1345 zebra_index_merge(zh);
1347 zh->reg->key_buf_used = 0;
1351 /* Not doing directly from memory, write into a temp file */
1352 extract_get_fname_tmp (zh, out_fname, zh->reg->key_file_no);
1354 if (!(outf = fopen (out_fname, "wb")))
1356 yaz_log (YLOG_FATAL|YLOG_ERRNO, "fopen %s", out_fname);
1359 yaz_log (YLOG_LOG, "writing section %d", zh->reg->key_file_no);
1360 prevcp = cp = (zh->reg->key_buf)[zh->reg->ptr_top - ptr_i];
1362 encode_key_init (&encode_info);
1363 encode_key_write (cp, &encode_info, outf);
1367 cp = (zh->reg->key_buf)[zh->reg->ptr_top - ptr_i];
/* a new term starts a new encoded group; otherwise only the part after the
   term text is written */
1368 if (strcmp (cp, prevcp))
1370 encode_key_flush ( &encode_info, outf);
1371 encode_key_init (&encode_info);
1372 encode_key_write (cp, &encode_info, outf);
1376 encode_key_write (cp + strlen(cp), &encode_info, outf);
1378 encode_key_flush ( &encode_info, outf);
1380 qsort (key_buf + ptr_top-ptr_i, ptr_i, sizeof(char*), key_x_compare);
1381 extract_get_fname_tmp (out_fname, key_file_no);
1383 if (!(outf = fopen (out_fname, "wb")))
1385 yaz_log (YLOG_FATAL|YLOG_ERRNO, "fopen %s", out_fname);
1388 yaz_log (YLOG_LOG, "writing section %d", key_file_no);
1390 prevcp = key_buf[ptr_top-i];
1392 if (!--i || strcmp (prevcp, key_buf[ptr_top-i]))
1394 key_y_len = strlen(prevcp)+1;
1396 yaz_log (YLOG_LOG, "key_y_len: %2d %02x %02x %s",
1397 key_y_len, prevcp[0], prevcp[1], 2+prevcp);
1399 qsort (key_buf + ptr_top-ptr_i, ptr_i - i,
1400 sizeof(char*), key_y_compare);
1401 cp = key_buf[ptr_top-ptr_i];
1403 encode_key_init (&encode_info);
1404 encode_key_write (cp, &encode_info, outf);
1407 cp = key_buf[ptr_top-ptr_i];
1408 encode_key_write (cp+key_y_len, &encode_info, outf);
1410 encode_key_flush ( &encode_info, outf);
1413 prevcp = key_buf[ptr_top-ptr_i];
/* a failing fclose is reported as fatal (the call itself is on a missing
   line) */
1418 yaz_log (YLOG_FATAL|YLOG_ERRNO, "fclose %s", out_fname);
1421 yaz_log (YLOG_LOG, "finished section %d", zh->reg->key_file_no);
/* the data area is empty again */
1423 zh->reg->key_buf_used = 0;
/* Appends one key plus its term text (str, slen bytes) to the record key
   buffer zh->reg->keys.
   The buffer is enlarged in steps of 128000 bytes whenever fewer than 1024
   bytes of headroom remain; the used part is copied into the new block.
   The key is written with iscz1_encode, followed by the raw term bytes, and
   buf_used is updated to the new end.
   NOTE(review): one parameter, the release of the old buffer and the
   advancing of dst past the term are on lines missing from this listing.
   NOTE(review): the 1024-byte headroom check does not depend on slen; that
   is only safe if callers bound the term length -- confirm. */
1426 void extract_add_it_key (ZebraHandle zh,
1428 const char *str, int slen, struct it_key *key)
1431 struct recKeys *keys = &zh->reg->keys;
1432 const char *src = (char*) key;
1434 if (keys->buf_used+1024 > keys->buf_max)
/* buf_max is increased as a side effect of the argument expression */
1436 char *b = (char *) xmalloc (keys->buf_max += 128000);
1437 if (keys->buf_used > 0)
1438 memcpy (b, keys->buf, keys->buf_used);
1442 dst = keys->buf + keys->buf_used;
1444 iscz1_encode(keys->codec_handle, &dst, &src);
1447 memcpy (dst, str, slen);
1450 keys->buf_used = dst - keys->buf;
/* Adds one index term (str, length bytes) for the word descriptor p.
   The attribute is mapped to an ordinal through the explain info: by
   attribute string (p->attrStr) or by set/use pair, adding the attribute
   when the lookup does not know it yet (the tests between lookup and add
   are on lines not shown).  A key is then filled with the record id,
   section id and sequence number from p and passed to extract_add_it_key.
   NOTE(review): declarations, braces and the assignments of key.len and
   key.mem[0] are missing from this listing.  The debug yaz_log below is
   presumably compiled out by directives that are not visible -- confirm. */
1453 void extract_add_index_string (RecWord *p, const char *str, int length)
1457 ZebraHandle zh = p->extractCtrl->handle;
1458 ZebraExplainInfo zei = zh->reg->zei;
1463 ch = zebraExplain_lookup_attr_str(zei, p->attrStr);
1465 ch = zebraExplain_add_attr_str(zei, p->attrStr);
1469 ch = zebraExplain_lookup_attr_su(zei, p->attrSet, p->attrUse);
1471 ch = zebraExplain_add_attr_su(zei, p->attrSet, p->attrUse);
1475 key.mem[1] = p->record_id;
1476 key.mem[2] = p->section_id;
1477 key.mem[3] = p->seqno;
1480 /* just for debugging .. */
1481 yaz_log(YLOG_LOG, "add: set=%d use=%d "
1482 "record_id=%lld section_id=%lld seqno=%lld",
1483 p->attrSet, p->attrUse, p->record_id, p->section_id, p->seqno);
1486 extract_add_it_key(p->extractCtrl->handle, p->reg_type, str,
/* Record a sort key for the attribute (p->attrSet, p->attrUse) in the
 * sort key buffer zh->reg->sortKeys.
 *
 * The buffer is a sequence of entries, each made of three key_SU-encoded
 * integers (set, use, length) followed by the string bytes.
 */
1490 static void extract_add_sort_string (RecWord *p, const char *str,
1493 ZebraHandle zh = p->extractCtrl->handle;
1494 struct sortKeys *sk = &zh->reg->sortKeys;
/* Walk the existing entries, decoding each header in turn. */
1497 while (off < sk->buf_used)
1501 off += key_SU_decode(&set, sk->buf + off);
1502 off += key_SU_decode(&use, sk->buf + off);
1503 off += key_SU_decode(&slen, sk->buf + off);
/* An entry for this attribute already exists.
 * NOTE(review): presumably the function returns here so that only the
 * first sort string per attribute is kept - confirm. */
1505 if (p->attrSet == set && p->attrUse == use)
/* After the walk the offset must land exactly on the end of the data. */
1508 assert (off == sk->buf_used);
/* Make sure there is room for IT_MAX_WORD more bytes. */
1510 if (sk->buf_used + IT_MAX_WORD > sk->buf_max)
1514 b = (char *) xmalloc (sk->buf_max += 128000);
/* Preserve the entries already stored. */
1515 if (sk->buf_used > 0)
1516 memcpy (b, sk->buf, sk->buf_used);
/* Append the new entry: header (set, use, length) then the bytes. */
1520 off += key_SU_encode(p->attrSet, sk->buf + off);
1521 off += key_SU_encode(p->attrUse, sk->buf + off);
1522 off += key_SU_encode(length, sk->buf + off);
1523 memcpy (sk->buf + off, str, length);
1524 sk->buf_used = off + length;
/* Route a term either to the sort key buffer or to the index keys.
 *
 * p       word descriptor; p->zebra_maps and p->reg_type select the route
 * string  term bytes
 * length  number of bytes in string; must be greater than zero
 */
1527 void extract_add_string (RecWord *p, const char *string, int length)
/* Empty terms are a caller error. */
1529 assert (length > 0);
/* Register types flagged as sort by zebra_maps go to the sort keys. */
1530 if (zebra_maps_is_sort (p->zebra_maps, p->reg_type))
1531 extract_add_sort_string (p, string, length);
/* NOTE(review): presumably the alternative branch of the test above -
 * confirm. */
1533 extract_add_index_string (p, string, length);
/* Break the term in p->term_buf / p->term_len into pieces separated by
 * mapped spaces and add each piece with extract_add_string().
 *
 * Input is consumed through zebra_maps_input(); a mapping result whose
 * first character equals *CHR_SPACE counts as a separator.
 */
1536 static void extract_add_incomplete_field (RecWord *p)
/* b is the read cursor into the term; remain is the byte count left. */
1538 const char *b = p->term_buf;
1539 int remain = p->term_len;
1540 const char **map = 0;
1542 yaz_log(YLOG_DEBUG, "Incomplete field, w='%.*s'", p->term_len, p->term_buf);
/* Fetch the first mapping; b is passed by address so the mapper can
 * move it forward. */
1545 map = zebra_maps_input(p->zebra_maps, p->reg_type, &b, remain, 0);
/* Buffer for one piece. */
1549 char buf[IT_MAX_WORD+1];
/* Skip over separators. */
1553 while (map && *map && **map == *CHR_SPACE)
/* Bytes left = total length minus distance the cursor has travelled. */
1555 remain = p->term_len - (b - p->term_buf);
1557 map = zebra_maps_input(p->zebra_maps, p->reg_type, &b, remain, 0);
/* Gather mapped characters until the next separator or end of input. */
1564 while (map && *map && **map != *CHR_SPACE)
1566 const char *cp = *map;
/* Copying stops once IT_MAX_WORD characters have been collected. */
1568 while (i < IT_MAX_WORD && *cp)
1570 remain = p->term_len - (b - p->term_buf);
1572 map = zebra_maps_input(p->zebra_maps, p->reg_type, &b, remain, 0);
/* Hand over the i characters collected in buf. */
1578 extract_add_string (p, buf, i);
/* Add the term in p->term_buf / p->term_len as ONE string: the mapped
 * characters of the whole field are gathered into a single buffer, which
 * is passed to extract_add_string() once at the end.
 *
 * At most IT_MAX_WORD characters are collected.
 */
1583 static void extract_add_complete_field (RecWord *p)
/* b is the read cursor; buf/i accumulate the normalized field. */
1585 const char *b = p->term_buf;
1586 char buf[IT_MAX_WORD+1];
1587 const char **map = 0;
1588 int i = 0, remain = p->term_len;
1590 yaz_log(YLOG_DEBUG, "Complete field, w='%.*s'",
1591 p->term_len, p->term_buf);
/* First mapping request; the last argument is 1 at the field start. */
1594 map = zebra_maps_input (p->zebra_maps, p->reg_type, &b, remain, 1);
/* Continue while input remains and the buffer has room. */
1596 while (remain > 0 && i < IT_MAX_WORD)
/* Skip over mapped spaces. */
1598 while (map && *map && **map == *CHR_SPACE)
/* Bytes left = total length minus distance the cursor has travelled. */
1600 remain = p->term_len - (b - p->term_buf);
/* The "first" flag stays set only while nothing has been stored yet. */
1604 int first = i ? 0 : 1; /* first position */
1605 map = zebra_maps_input(p->zebra_maps, p->reg_type, &b, remain, first);
/* Put one *CHR_SPACE between pieces, but never at the very start. */
1613 if (i && i < IT_MAX_WORD)
1614 buf[i++] = *CHR_SPACE;
/* Gather mapped characters up to the next space. */
1615 while (map && *map && **map != *CHR_SPACE)
1617 const char *cp = *map;
/* NOTE(review): *CHR_CUT gets special treatment here; what that
 * treatment is should be checked against the full function. */
1619 if (**map == *CHR_CUT)
/* Buffer-full check. */
1625 if (i >= IT_MAX_WORD)
1627 yaz_log(YLOG_DEBUG, "Adding string to index '%d'", **map);
/* Copying is bounded by IT_MAX_WORD. */
1628 while (i < IT_MAX_WORD && *cp)
1631 remain = p->term_len - (b - p->term_buf);
1634 map = zebra_maps_input (p->zebra_maps, p->reg_type, &b,
/* Hand over the whole collected field. */
1643 extract_add_string (p, buf, i);
/* Entry point for adding one token described by p.
 *
 * The term is first offered to zebra_replace(); it is then processed as a
 * complete or an incomplete field according to
 * zebra_maps_is_complete() for p->reg_type.
 */
1646 void extract_token_add (RecWord *p)
1650 yaz_log (YLOG_LOG, "token_add "
1651 "reg_type=%c attrSet=%d attrUse=%d seqno=%d s=%.*s",
1652 p->reg_type, p->attrSet, p->attrUse, p->seqno, p->length,
/* A non-null result from zebra_replace() supersedes the original term:
 * p->term_buf and p->term_len are redirected to the WRBUF contents. */
1655 if ((wrbuf = zebra_replace(p->zebra_maps, p->reg_type, 0,
1656 p->term_buf, p->term_len)))
1658 p->term_buf = wrbuf_buf(wrbuf);
1659 p->term_len = wrbuf_len(wrbuf);
/* Choose the field handler for this register type. */
1661 if (zebra_maps_is_complete (p->zebra_maps, p->reg_type))
1662 extract_add_complete_field (p);
/* NOTE(review): presumably the alternative branch of the test above -
 * confirm. */
1664 extract_add_incomplete_field(p);
/* Register a schema OID with the explain info of the handle stored in
 * the extract control block.
 *
 * p    extract control; p->handle is used as the ZebraHandle
 * oid  schema OID forwarded to zebraExplain_addSchema()
 */
1667 void extract_schema_add (struct recExtractCtrl *p, Odr_oid *oid)
1669 ZebraHandle zh = (ZebraHandle) (p->handle);
1670 zebraExplain_addSchema (zh->reg->zei, oid);
/* Transfer the sort keys collected in sk to the sort index of zh for
 * the record identified by sysno.
 *
 * zh     handle; zh->reg->sortIdx is the destination
 * sysno  record number selected in the sort index before any update
 * cmd    NOTE(review): presumably chooses between the two sortIdx_add
 *        calls below (store the key vs. store an empty string) - confirm
 * sk     buffer of (set, use, length, bytes) entries
 */
1673 void extract_flushSortKeys (ZebraHandle zh, SYSNO sysno,
1674 int cmd, struct sortKeys *sk)
1676 SortIdx sortIdx = zh->reg->sortIdx;
/* All following sort index operations refer to this record. */
1679 sortIdx_sysno (sortIdx, sysno);
/* Walk every entry in the buffer. */
1681 while (off < sk->buf_used)
/* Entry header: three key_SU-encoded integers. */
1685 off += key_SU_decode(&set, sk->buf + off);
1686 off += key_SU_decode(&use, sk->buf + off);
1687 off += key_SU_decode(&slen, sk->buf + off);
/* The sort index is addressed by the use value only. */
1689 sortIdx_type(sortIdx, use);
/* Store the slen bytes that follow the header ... */
1691 sortIdx_add(sortIdx, sk->buf + off, slen);
/* ... or store a one-byte empty string instead. */
1693 sortIdx_add(sortIdx, "", 1);
/* Set up an encode_info before a series of encode_key_write() calls.
 *
 * i  state to initialise; receives a new encoder handle from
 *    iscz1_start() in i->encode_handle
 */
1698 void encode_key_init (struct encode_info *i)
1707 i->encode_handle = iscz1_start();
1713 /* this is the old encode_key_write
1714 * may be deleted once we are confident that the new works
/* Encode one key entry and write it to outf (older implementation).
 *
 * k     entry to write: a NUL-terminated term, then a command byte
 *       (insert/delete), then a struct it_key
 * i     encoder state; i->buf is used as the output staging buffer
 * outf  destination stream
 *
 * A failed fwrite() is logged with YLOG_FATAL|YLOG_ERRNO.
 */
1717 void encode_key_write (char *k, struct encode_info *i, FILE *outf)
/* bp is the write cursor in the staging buffer.
 * NOTE(review): bp0 presumably marks the byte reserved for the combined
 * length/command value written below - confirm where it is set. */
1720 char *bp = i->buf, *bp0;
1721 const char *src = (char *) &key;
1723 /* copy term to output buf */
/* Copies up to and including the terminating NUL; k ends up just past it. */
1724 while ((*bp++ = *k++))
1726 /* and copy & align key so we can mangle */
1727 memcpy (&key, k+1, sizeof(struct it_key)); /* *k is insert/delete */
/* Append the encoded key at the cursor. */
1730 iscz1_encode(i->encode_handle, &bp, &src);
1731 *bp0 = (*k * 128) + bp - bp0 - 1; /* length and insert/delete combined */
/* Everything staged so far goes out as a single item. */
1732 if (fwrite (i->buf, bp - i->buf, 1, outf) != 1)
1734 yaz_log (YLOG_FATAL|YLOG_ERRNO, "fwrite");
/* Finish a series of encode_key_write() calls (older implementation).
 *
 * i     encoder state whose handle is released
 * outf  not used by the statement shown here
 */
1739 void encode_key_flush (struct encode_info *i, FILE *outf)
1740 { /* nothing is written here; only the encoder handle is released */
1741 iscz1_stop(i->encode_handle);
1746 /* new encode_key_write
1747 * The idea is to buffer one more key, and compare them
1748 * If we are going to delete and insert the same key,
1749 * we may as well not bother. Should make a difference in
1750 * updates with small modifications (appending to a mbox)
/* Encode one key entry with one-entry look-behind (newer implementation).
 *
 * k     entry: a term (may be empty when the term is unchanged), then a
 *       command byte, then a struct it_key
 * i     encoder state; holds the pending entry in prevsys/prevseq/prevcmd
 *       and the last written one in sysno/seqno/cmd
 * outf  destination stream
 *
 * The incoming entry is compared with the pending one; a pending entry is
 * only written out when the new one differs from it.
 */
1752 void encode_key_write (char *k, struct encode_info *i, FILE *outf)
1757 if (*k) /* first time for new key */
/* Stage the term, including its NUL, in i->buf. */
1760 while ((*bp++ = *k++))
/* keylen is the term length without the NUL. */
1762 i->keylen= bp - i->buf -1;
/* Term, NUL and one it_key must fit in the staging buffer. */
1763 assert(i->keylen+1+sizeof(struct it_key) < ENCODE_BUFLEN);
/* Position the cursor at the end of the staged term. */
1767 bp=i->buf + i->keylen;
/* Copy the key out of the entry into an aligned local. */
1772 memcpy (&key, k+1, sizeof(struct it_key));
1773 if (0==i->prevsys) /* no previous filter, fill up */
/* Nothing pending yet: remember this entry. */
1775 i->prevsys=key.sysno;
1776 i->prevseq=key.seqno;
1779 else if ( (i->prevsys==key.sysno) &&
1780 (i->prevseq==key.seqno) &&
1782 { /* same numbers, diff cmd, they cancel out */
1786 { /* different stuff, write previous, move buf */
/* sysno is stored as a delta from the last written one, doubled, with
 * the command added in. */
1787 bp = encode_key_int ( (i->prevsys - i->sysno) * 2 + i->prevcmd, bp);
/* The record changed: the written sysno becomes the pending one. */
1788 if (i->sysno != i->prevsys)
1790 i->sysno = i->prevsys;
1793 else if (!i->seqno && !i->prevseq && i->cmd == i->prevcmd)
1795 return; /* ??? Filters some sort of duplicates away */
1796 /* ??? Can this ever happen -H 15oct02 */
/* seqno is stored as a delta as well. */
1798 bp = encode_key_int (i->prevseq - i->seqno, bp);
1799 i->seqno = i->prevseq;
1800 i->cmd = i->prevcmd;
/* Emit the staged bytes as a single item; failure is logged as fatal. */
1801 if (fwrite (i->buf, bp - i->buf, 1, outf) != 1)
1803 yaz_log (YLOG_FATAL|YLOG_ERRNO, "fwrite");
1806 i->keylen=0; /* ok, it's written, forget it */
/* The incoming entry becomes the pending one. */
1807 i->prevsys=key.sysno;
1808 i->prevseq=key.seqno;
1813 void encode_key_flush (struct encode_info *i, FILE *outf)
1814 { /* flush the last key from i */
1815 char *bp =i->buf + i->keylen;
1818 return; /* nothing to flush */
1821 bp = encode_key_int ( (i->prevsys - i->sysno) * 2 + i->prevcmd, bp);
1822 if (i->sysno != i->prevsys)
1824 i->sysno = i->prevsys;
1827 else if (!i->seqno && !i->prevseq && i->cmd == i->prevcmd)
1829 return; /* ??? Filters some sort of duplicates away */
1830 /* ??? Can this ever happen -H 15oct02 */
1832 bp = encode_key_int (i->prevseq - i->seqno, bp);
1833 i->seqno = i->prevseq;
1834 i->cmd = i->prevcmd;
1835 if (fwrite (i->buf, bp - i->buf, 1, outf) != 1)
1837 yaz_log (YLOG_FATAL|YLOG_ERRNO, "fwrite");
1840 i->keylen=0; /* ok, it's written, forget it */
1841 i->prevsys=0; /* forget the values too */