2 * Copyright (c) 1995-1998, Index Data.
3 * See the file LICENSE for details.
6 * Isamd - isam with diffs
9 * most of it, this is just a copy of isamh
24 #include "../index/index.h" /* for dump */
/* Forward declarations for static helpers that are defined later in this file. */
26 static void flush_block (ISAMD is, int cat);
27 static void release_fc (ISAMD is, int cat);
28 static void init_fc (ISAMD is, int cat);
/* Tested by the "#if ISAMD_FREELIST_CHUNK" that precedes the free-list
   helpers (flush_block / alloc_block / release_block); it is set to 1 here. */
30 #define ISAMD_FREELIST_CHUNK 1
/* isamd_getmethod: allocate an ISAMD_M with xmalloc and fill in settings;
   the assignments shown set compare_item to NULL and max_blocks_mem to 10.
   def_cat is a static table of file categories (block size plus a key limit
   per entry, as its column comment says).
   NOTE(review): how the `me` argument is used and what is returned are not
   shown on these lines -- confirm before relying on this summary. */
34 ISAMD_M isamd_getmethod (ISAMD_M me)
36 static struct ISAMD_filecat_s def_cat[] = {
38 /* blocksz, max keys before switching size */
48 /* old values from isamc, long time ago...
57 /* assume about 2 bytes per pointer, when compressed. The head uses */
58 /* 16 bytes, and other blocks use 8 for header info... If you want 3 */
59 /* blocks of 32 bytes, say max 16+24+24 = 64 keys */
/* Storage for the descriptor, sized from the pointed-to type. */
62 ISAMD_M m = (ISAMD_M) xmalloc (sizeof(*m));
70 m->compare_item = NULL;
74 m->max_blocks_mem = 10;
/* isamd_open: create an ISAMD handle on top of the block files in `bfs`.
   A private copy of `method` is taken, the filecat table is scanned to count
   the block categories, and one block file per category is opened under
   `name` followed by a letter suffix ('A' + category index).  For every file
   the head is read from block 0, the free-list buffer is allocated and the
   statistics counters are cleared.
   NOTE(review): the use of `writeflag` and the return statement are not on
   the lines shown here. */
81 ISAMD isamd_open (BFiles bfs, const char *name, int writeflag, ISAMD_M method)
84 ISAMD_filecat filecat;
87 is = (ISAMD) xmalloc (sizeof(*is));
/* Copy the caller's method structure into storage owned by this handle. */
89 is->method = (ISAMD_M) xmalloc (sizeof(*is->method));
90 memcpy (is->method, method, sizeof(*method));
91 filecat = is->method->filecat;
94 /* determine number of block categories */
95 if (is->method->debug)
96 logf (LOG_LOG, "isamd: bsize maxkeys");
99 if (is->method->debug)
100 logf (LOG_LOG, "isamd:%6d %6d",
101 filecat[i].bsize, filecat[i].mblocks);
/* The scan stops after the first entry whose mblocks is 0. */
102 } while (filecat[i++].mblocks);
106 assert (is->no_files > 0);
107 is->files = (ISAMD_file) xmalloc (sizeof(*is->files)*is->no_files);
110 /* TODO - what ever needs to be done here... */
/* Per-category setup: open the block file and initialise its bookkeeping. */
116 for (i = 0; i<is->no_files; i++)
/* File name is `name` plus one letter: 'A' for category 0, 'B' for 1, ... */
120 sprintf (fname, "%s%c", name, i+'A');
121 is->files[i].bf = bf_open (bfs, fname, is->method->filecat[i].bsize,
123 is->files[i].head_is_dirty = 0;
/* Load the ISAMD_head from block 0; the two assignments below presumably
   run only when bf_read returns 0 (no head stored yet) -- TODO confirm. */
124 if (!bf_read (is->files[i].bf, 0, 0, sizeof(ISAMD_head),
127 is->files[i].head.lastblock = 1;
128 is->files[i].head.freelist = 0;
130 is->files[i].alloc_entries_num = 0;
/* Capacity of the free-list buffer: ints per block, minus one. */
131 is->files[i].alloc_entries_max =
132 is->method->filecat[i].bsize / sizeof(int) - 1;
/* The free-list buffer is exactly one block of this category in size. */
133 is->files[i].alloc_buf = (char *)
134 xmalloc (is->method->filecat[i].bsize);
135 is->files[i].no_writes = 0; /* clear statistics */
136 is->files[i].no_reads = 0;
137 is->files[i].no_skip_writes = 0;
138 is->files[i].no_allocated = 0;
139 is->files[i].no_released = 0;
140 is->files[i].no_remap = 0;
141 is->files[i].no_forward = 0;
142 is->files[i].no_backward = 0;
143 is->files[i].sum_forward = 0;
144 is->files[i].sum_backward = 0;
145 is->files[i].no_next = 0;
146 is->files[i].no_prev = 0;
/* isamd_block_used: return head.lastblock - 1 for file category `type`.
   `type` is range-checked against no_files before it indexes files[].
   NOTE(review): the value returned for an out-of-range `type` is not on
   the lines shown here. */
153 int isamd_block_used (ISAMD is, int type)
155 if (type < 0 || type >= is->no_files)
157 return is->files[type].head.lastblock-1;
/* isamd_block_size: return the configured block size (filecat[type].bsize)
   of file category `type`.  `type` is range-checked against no_files first.
   NOTE(review): the value returned for an out-of-range `type` is not on
   the lines shown here. */
160 int isamd_block_size (ISAMD is, int type)
162 ISAMD_filecat filecat = is->method->filecat;
163 if (type < 0 || type >= is->no_files)
165 return filecat[type].bsize;
/* isamd_close: shut down an ISAMD handle.
   With method->debug set, two statistics tables are logged: block-to-block
   navigation counters, then I/O and allocation counters.  For every file the
   head is written back to block 0 when head_is_dirty is set, the fc_list
   array is freed and the block file is closed.
   NOTE(review): the return value and any further cleanup are not on the
   lines shown here. */
168 int isamd_close (ISAMD is)
172 if (is->method->debug)
174 logf (LOG_LOG, "isamd: next forw mid-f prev backw mid-b");
175 for (i = 0; i<is->no_files; i++)
176 logf (LOG_LOG, "isamd:%8d%8d%8.1f%8d%8d%8.1f",
177 is->files[i].no_next,
178 is->files[i].no_forward,
/* Mean forward distance; the division is guarded by a non-zero count. */
179 is->files[i].no_forward ?
180 (double) is->files[i].sum_forward/is->files[i].no_forward
182 is->files[i].no_prev,
183 is->files[i].no_backward,
/* Mean backward distance; the division is guarded by a non-zero count. */
184 is->files[i].no_backward ?
185 (double) is->files[i].sum_backward/is->files[i].no_backward
188 if (is->method->debug)
189 logf (LOG_LOG, "isamd: writes reads skipped alloc released remap");
190 for (i = 0; i<is->no_files; i++)
193 assert (is->files[i].bf);
/* Persist the in-memory head to block 0 only if it was modified. */
194 if (is->files[i].head_is_dirty)
195 bf_write (is->files[i].bf, 0, 0, sizeof(ISAMD_head),
197 if (is->method->debug)
198 logf (LOG_LOG, "isamd:%8d%8d%8d%8d%8d%8d",
199 is->files[i].no_writes,
200 is->files[i].no_reads,
201 is->files[i].no_skip_writes,
202 is->files[i].no_allocated,
203 is->files[i].no_released,
204 is->files[i].no_remap);
205 xfree (is->files[i].fc_list);
207 bf_close (is->files[i].bf);
/* isamd_read_block: read block `pos` of file category `cat` into `dst`.
   Increments the category's no_reads counter and returns whatever bf_read
   returns. */
215 int isamd_read_block (ISAMD is, int cat, int pos, char *dst)
217 ++(is->files[cat].no_reads);
218 return bf_read (is->files[cat].bf, pos, 0, 0, dst);
/* isamd_write_block: write `src` to block `pos` of file category `cat`.
   Increments the category's no_writes counter, logs the write when
   method->debug is above 2, and returns whatever bf_write returns. */
221 int isamd_write_block (ISAMD is, int cat, int pos, char *src)
223 ++(is->files[cat].no_writes);
224 if (is->method->debug > 2)
225 logf (LOG_LOG, "isamd: write_block %d %d", cat, pos);
226 return bf_write (is->files[cat].bf, pos, 0, 0, src);
/* isamd_write_dblock: prepend a block header to a data area and write it.
   `src` points at the data; the header is stored in the ISAMD_BLOCK_OFFSET_N
   bytes immediately before it, so the caller must own that space.
   The header holds `nextpos` followed by the block size, which is `offset`
   plus the header length.  Returns the result of isamd_write_block. */
229 int isamd_write_dblock (ISAMD is, int cat, int pos, char *src,
230 int nextpos, int offset)
232 ISAMD_BLOCK_SIZE size = offset + ISAMD_BLOCK_OFFSET_N;
233 if (is->method->debug > 2)
234 logf (LOG_LOG, "isamd: write_dblock. size=%d nextpos=%d",
235 (int) size, nextpos);
/* Step back to the start of the header area in front of the data. */
236 src -= ISAMD_BLOCK_OFFSET_N;
/* The header is expected to be exactly two ints long.
   NOTE(review): the second memcpy copies sizeof(size) bytes, so this
   assumes sizeof(ISAMD_BLOCK_SIZE) <= sizeof(int) -- TODO confirm. */
237 assert( ISAMD_BLOCK_OFFSET_N == sizeof(int)+sizeof(int) );
238 memcpy (src, &nextpos, sizeof(int));
239 memcpy (src + sizeof(int), &size, sizeof(size));
240 return isamd_write_block (is, cat, pos, src);
243 #if ISAMD_FREELIST_CHUNK
/* flush_block: write the buffered free-list entries of category `cat` out.
   When the head has a free-list block and alloc_entries_num is non-zero, the
   entry count is stored in the first int of alloc_buf, the buffer is written
   to the free-list block, and alloc_entries_num is reset to 0. */
244 static void flush_block (ISAMD is, int cat)
246 char *abuf = is->files[cat].alloc_buf;
247 int block = is->files[cat].head.freelist;
248 if (block && is->files[cat].alloc_entries_num)
250 memcpy (abuf, &is->files[cat].alloc_entries_num, sizeof(int));
251 bf_write (is->files[cat].bf, block, 0, 0, abuf);
252 is->files[cat].alloc_entries_num = 0;
/* alloc_block: obtain a block number in category `cat`.
   Without a free list the file grows: head.lastblock is handed out and
   incremented.  Otherwise a block number comes from the buffered free-list
   block in alloc_buf, which is loaded from disk when alloc_entries_num is 0.
   Buffer layout as used by the memcpy calls here: first int = entry count,
   second int = next free-list block, remaining ints = free block numbers.
   NOTE(review): braces, else branches and the return are not on the lines
   shown here; the nesting described in the comments is presumed. */
257 static int alloc_block (ISAMD is, int cat)
259 int block = is->files[cat].head.freelist;
260 char *abuf = is->files[cat].alloc_buf;
262 (is->files[cat].no_allocated)++;
266 block = (is->files[cat].head.lastblock)++; /* no free list */
267 is->files[cat].head_is_dirty = 1;
271 if (!is->files[cat].alloc_entries_num) /* read first time */
273 bf_read (is->files[cat].bf, block, 0, 0, abuf);
274 memcpy (&is->files[cat].alloc_entries_num, abuf,
275 sizeof(is->files[cat].alloc_entries_num));
276 assert (is->files[cat].alloc_entries_num > 0);
278 /* have some free blocks now */
279 assert (is->files[cat].alloc_entries_num > 0);
280 is->files[cat].alloc_entries_num--;
281 if (!is->files[cat].alloc_entries_num) /* last one in block? */
/* Advance the head to the next free-list block (second int of the buffer). */
283 memcpy (&is->files[cat].head.freelist, abuf + sizeof(int),
285 is->files[cat].head_is_dirty = 1;
/* If another free-list block exists, load it and pick up its entry count. */
287 if (is->files[cat].head.freelist)
289 bf_read (is->files[cat].bf, is->files[cat].head.freelist,
291 memcpy (&is->files[cat].alloc_entries_num, abuf,
292 sizeof(is->files[cat].alloc_entries_num));
293 assert (is->files[cat].alloc_entries_num);
/* Fetch the entry at index alloc_entries_num; entries start one int in. */
297 memcpy (&block, abuf + sizeof(int) + sizeof(int) *
298 is->files[cat].alloc_entries_num, sizeof(int));
/* release_block: put block `pos` of category `cat` back on the free list.
   The free-list block is read into alloc_buf when it is not buffered yet.
   A full buffer (alloc_entries_max entries) is written out before a new
   buffer is started.  When a new buffer is started, `pos` becomes the head
   of the free list and the old head is stored as its link in the second int.
   NOTE(review): braces and else branches are not on the lines shown here;
   the nesting described in the comments is presumed. */
303 static void release_block (ISAMD is, int cat, int pos)
305 char *abuf = is->files[cat].alloc_buf;
306 int block = is->files[cat].head.freelist;
308 (is->files[cat].no_released)++;
310 if (block && !is->files[cat].alloc_entries_num) /* must read block */
312 bf_read (is->files[cat].bf, block, 0, 0, abuf);
313 memcpy (&is->files[cat].alloc_entries_num, abuf,
314 sizeof(is->files[cat].alloc_entries_num));
315 assert (is->files[cat].alloc_entries_num > 0);
317 assert (is->files[cat].alloc_entries_num <= is->files[cat].alloc_entries_max);
/* Buffer full: store the count in its first int and write it to disk. */
318 if (is->files[cat].alloc_entries_num == is->files[cat].alloc_entries_max)
321 memcpy (abuf, &is->files[cat].alloc_entries_num, sizeof(int));
322 bf_write (is->files[cat].bf, block, 0, 0, abuf);
323 is->files[cat].alloc_entries_num = 0;
325 if (!is->files[cat].alloc_entries_num) /* make new buffer? */
/* The link to the previous free-list block goes in the second int. */
327 memcpy (abuf + sizeof(int), &block, sizeof(int));
328 is->files[cat].head.freelist = pos;
329 is->files[cat].head_is_dirty = 1;
/* Destination is the slot at index alloc_entries_num, one int into the buffer. */
333 memcpy (abuf + sizeof(int) +
334 is->files[cat].alloc_entries_num*sizeof(int),
337 is->files[cat].alloc_entries_num++;
/* flush_block: second definition of the free-list flush helper.
   NOTE(review): presumably the alternative compiled when
   ISAMD_FREELIST_CHUNK is 0; the body is not on the lines shown here. */
340 static void flush_block (ISAMD is, int cat)
342 char *abuf = is->files[cat].alloc_buf;
/* alloc_block: second definition; the free list is a chain of blocks.
   The head is marked dirty and no_allocated is incremented.  If the head has
   a free-list block, that block is taken and its first int is read from disk
   to become the new free-list head.  The lastblock++ assignment is
   presumably the branch for an empty free list.
   NOTE(review): the else keyword and the return are not on the lines shown
   here. */
346 static int alloc_block (ISAMD is, int cat)
349 char buf[sizeof(int)];
351 is->files[cat].head_is_dirty = 1;
352 (is->files[cat].no_allocated)++;
353 if ((block = is->files[cat].head.freelist))
355 bf_read (is->files[cat].bf, block, 0, sizeof(int), buf);
356 memcpy (&is->files[cat].head.freelist, buf, sizeof(int));
359 block = (is->files[cat].head.lastblock)++;
/* release_block: second definition; push block `pos` on the free-list chain.
   The current free-list head is written into the first int of block `pos`,
   and `pos` becomes the new head.  The head is marked dirty and no_released
   is incremented. */
363 static void release_block (ISAMD is, int cat, int pos)
365 char buf[sizeof(int)];
367 (is->files[cat].no_released)++;
368 is->files[cat].head_is_dirty = 1;
369 memcpy (buf, &is->files[cat].head.freelist, sizeof(int));
370 is->files[cat].head.freelist = pos;
371 bf_write (is->files[cat].bf, pos, 0, sizeof(int), buf);
/* isamd_alloc_block: allocate a block in category `cat`.
   When the category has an fc_list, it is scanned for the lowest non-zero
   block number.  alloc_block is presumably the fallback when that scan
   yields nothing.  The result is logged when method->debug is above 3.
   NOTE(review): the conditions around the fc_list slot reset and the
   alloc_block call, and the return, are not on the lines shown here. */
375 int isamd_alloc_block (ISAMD is, int cat)
379 if (is->files[cat].fc_list)
382 for (j = 0; j < is->files[cat].fc_max; j++)
/* Candidate when the slot is non-zero and lower than the best so far. */
383 if ((nb = is->files[cat].fc_list[j]) && (!block || nb < block))
385 is->files[cat].fc_list[j] = 0;
391 block = alloc_block (is, cat);
392 if (is->method->debug > 3)
393 logf (LOG_LOG, "isamd: alloc_block in cat %d: %d", cat, block);
/* isamd_release_block: give block `pos` of category `cat` back.
   The release is logged when method->debug is above 3.  When the category
   has an fc_list, `pos` is stored in an empty (zero) slot.  release_block is
   presumably called when no slot is available or no fc_list exists.
   NOTE(review): the early exit after storing into fc_list is not on the
   lines shown here. */
397 void isamd_release_block (ISAMD is, int cat, int pos)
399 if (is->method->debug > 3)
400 logf (LOG_LOG, "isamd: release_block in cat %d: %d", cat, pos);
401 if (is->files[cat].fc_list)
404 for (j = 0; j<is->files[cat].fc_max; j++)
405 if (!is->files[cat].fc_list[j])
407 is->files[cat].fc_list[j] = pos;
411 release_block (is, cat, pos);
/* init_fc: set up the fc_list array of category `cat`.
   fc_max is set to j, an array of j entries is allocated, and entries are
   set to 0 (an empty slot, as tested in isamd_release_block).
   NOTE(review): the value of j and the loop header are not on the lines
   shown here. */
414 static void init_fc (ISAMD is, int cat)
418 is->files[cat].fc_max = j;
419 is->files[cat].fc_list = (int *)
420 xmalloc (sizeof(*is->files[0].fc_list) * j);
422 is->files[cat].fc_list[j] = 0;
/* release_fc: empty the fc_list of category `cat`.
   Each non-zero entry is handed to release_block and its slot is set to 0.
   NOTE(review): j starts at fc_max; the loop header that steps it is not on
   the lines shown here. */
425 static void release_fc (ISAMD is, int cat)
427 int b, j = is->files[cat].fc_max;
430 if ((b = is->files[cat].fc_list[j]))
432 release_block (is, cat, b);
433 is->files[cat].fc_list[j] = 0;
/* isamd_pp_close: close a position handle opened with isamd_pp_open.
   The method's code_stop hook is called with ISAMD_DECODE and the handle's
   decodeClientData.
   NOTE(review): freeing of pp and its buffer is not on the lines shown
   here. */
437 void isamd_pp_close (ISAMD_PP pp)
441 (*is->method->code_stop)(ISAMD_DECODE, pp->decodeClientData);
/* isamd_pp_open: create a position handle for the entry addressed by `ipos`.
   The address is split into category (isamd_type) and block number
   (isamd_block), and a buffer of that category's block size is allocated.
   The block is read and its header is unpacked into pp: next, size, numKeys
   and diffs, in that order.  pp->offset is left just past the header.
   NOTE(review): conditions around the read (such as an empty `ipos`) and
   the return are not on the lines shown here. */
446 ISAMD_PP isamd_pp_open (ISAMD is, ISAMD_P ipos)
448 ISAMD_PP pp = (ISAMD_PP) xmalloc (sizeof(*pp));
451 pp->cat = isamd_type(ipos);
452 pp->pos = isamd_block(ipos);
454 src = pp->buf = (char *) xmalloc (is->method->filecat[pp->cat].bsize);
/* Decoder state obtained here is passed to code_stop in isamd_pp_close. */
460 pp->decodeClientData = (*is->method->code_start)(ISAMD_DECODE);
461 //pp->deleteFlag = 0;
468 isamd_read_block (is, pp->cat, pp->pos, src);
/* Unpack the header fields one after another, advancing src past each. */
469 memcpy (&pp->next, src, sizeof(pp->next));
470 src += sizeof(pp->next);
471 memcpy (&pp->size, src, sizeof(pp->size));
472 src += sizeof(pp->size);
473 memcpy (&pp->numKeys, src, sizeof(pp->numKeys));
474 src += sizeof(pp->numKeys);
475 memcpy (&pp->diffs, src, sizeof(pp->diffs));
476 src += sizeof(pp->diffs);
/* NOTE(review): this compares next with the bare block number, whereas
   isamd_read_item compares it with isamd_addr(pos,cat) -- confirm intent. */
477 assert (pp->next != pp->pos);
478 pp->offset = src - pp->buf;
479 assert (pp->offset == ISAMD_BLOCK_OFFSET_1);
480 if (is->method->debug > 2)
481 logf (LOG_LOG, "isamd_pp_open sz=%d c=%d p=%d n=%d",
482 pp->size, pp->cat, pp->pos, isamd_block(pp->next));
/* isamd_buildfirstblock: serialise the first-block header of `pp`.
   next, size, numKeys and diffs are copied to `dst` in that order, the same
   order in which isamd_pp_open unpacks them.  The written length must equal
   ISAMD_BLOCK_OFFSET_1, measured from pp->buf.
   NOTE(review): the initialisation of dst is not on the lines shown here;
   the final assert implies it starts at pp->buf. */
489 void isamd_buildfirstblock(ISAMD_PP pp){
492 assert(pp->next != pp->pos);
493 memcpy(dst, &pp->next, sizeof(pp->next) );
494 dst += sizeof(pp->next);
495 memcpy(dst, &pp->size,sizeof(pp->size));
496 dst += sizeof(pp->size);
497 memcpy(dst, &pp->numKeys, sizeof(pp->numKeys));
498 dst += sizeof(pp->numKeys);
499 memcpy(dst, &pp->diffs, sizeof(pp->diffs));
500 dst += sizeof(pp->diffs);
501 assert (dst - pp->buf == ISAMD_BLOCK_OFFSET_1);
502 if (pp->is->method->debug > 2)
503 logf (LOG_LOG, "isamd: first: sz=%d p=%d/%d>%d/%d nk=%d d=%d",
506 isamd_type(pp->next), isamd_block(pp->next),
507 pp->numKeys, pp->diffs);
/* isamd_buildlaterblock: serialise the header of a non-first block of `pp`.
   Only next and size are copied to `dst`.  The written length must equal
   ISAMD_BLOCK_OFFSET_N, measured from pp->buf.
   NOTE(review): the initialisation of dst is not on the lines shown here;
   the final assert implies it starts at pp->buf. */
510 void isamd_buildlaterblock(ISAMD_PP pp){
513 assert(pp->next != isamd_addr(pp->pos,pp->cat));
514 memcpy(dst, &pp->next, sizeof(pp->next) );
515 dst += sizeof(pp->next);
516 memcpy(dst, &pp->size,sizeof(pp->size));
517 dst += sizeof(pp->size);
518 assert (dst - pp->buf == ISAMD_BLOCK_OFFSET_N);
519 if (pp->is->method->debug > 2)
520 logf (LOG_LOG, "isamd: l8r: sz=%d p=%d/%d>%d/%d",
/* NOTE(review): the arguments for `next` are block,type here but type,block
   in isamd_buildfirstblock -- confirm which order the format intends. */
523 isamd_block(pp->next), isamd_type(pp->next) );
528 /* returns non-zero if item could be read; 0 otherwise */
/* Thin wrapper: forwards to isamd_read_item, passing the address of the
   local `buf` parameter so the decoder can write through and advance it.
   The advanced pointer is local to this call and is not handed back. */
529 int isamd_pp_read (ISAMD_PP pp, void *buf)
531 return isamd_read_item (pp, (char **) &buf);
534 /* read one item from file - decode and store it in *dst.
537 1 if item could be read ok and NO boundary
538 2 if item could be read ok and boundary */
/* When the current block is used up (offset >= size) the chain is followed
   through pp->next: navigation statistics are updated, the buffer is resized
   if the next block is in another category, the block is read and its
   next/size header is unpacked, and the decoder is reset before the first
   item is decoded.  Otherwise the next item is decoded from the current
   buffer.
   NOTE(review): braces, else branches and most return statements are not on
   the lines shown here; the nesting described in the comments is presumed. */
539 int isamd_read_item (ISAMD_PP pp, char **dst)
542 char *src = pp->buf + pp->offset;
545 if (pp->offset >= pp->size)
550 return 0; /* end of file */
/* Statistics: classify the jump as next / forward / previous / backward. */
552 if (pp->next > pp->pos)
554 if (pp->next == pp->pos + 1)
555 is->files[pp->cat].no_next++;
558 is->files[pp->cat].no_forward++;
559 is->files[pp->cat].sum_forward += pp->next - pp->pos;
564 if (pp->next + 1 == pp->pos)
565 is->files[pp->cat].no_prev++;
568 is->files[pp->cat].no_backward++;
569 is->files[pp->cat].sum_backward += pp->pos - pp->next;
572 /* out new block position */
573 newcat = isamd_type(pp->next);
/* A different category has a different block size, so resize the buffer.
   NOTE(review): src was derived from the old pp->buf; confirm that it is
   re-pointed at pp->buf before the read below. */
574 if (pp->cat != newcat ) {
575 pp->buf = xrealloc(pp->buf, is->method->filecat[newcat].bsize);
577 pp->pos = isamd_block(pp->next);
578 pp->cat = isamd_type(pp->next);
581 /* read block and save 'next' and 'size' entry */
582 isamd_read_block (is, pp->cat, pp->pos, src);
583 memcpy (&pp->next, src, sizeof(pp->next));
584 src += sizeof(pp->next);
585 memcpy (&pp->size, src, sizeof(pp->size));
586 src += sizeof(pp->size);
587 /* assume block is non-empty */
588 assert (src - pp->buf == ISAMD_BLOCK_OFFSET_N);
589 assert (pp->next != isamd_addr(pp->pos,pp->cat));
590 //if (pp->deleteFlag)
591 // isamd_release_block (is, pp->cat, pp->pos);
/* The decoder is reset before the first item of the new block is decoded. */
592 (*is->method->code_reset)(pp->decodeClientData);
593 (*is->method->code_item)(ISAMD_DECODE, pp->decodeClientData, dst, &src);
/* code_item was handed &src; record how far the block has been consumed. */
594 pp->offset = src - pp->buf;
595 if (is->method->debug > 2)
596 logf (LOG_LOG, "isamd: read_block size=%d %d %d next=%d",
597 pp->size, pp->cat, pp->pos, pp->next);
/* Decode the next item from the block already in the buffer. */
600 (*is->method->code_item)(ISAMD_DECODE, pp->decodeClientData, dst, &src);
601 pp->offset = src - pp->buf;
/* isamd_pp_num: integer query on a position handle.
   NOTE(review): the body is not on the lines shown here; presumably it
   returns pp->numKeys -- confirm. */
605 int isamd_pp_num (ISAMD_PP pp)
/* hexdump: format bytes from `p` as two-digit lowercase hex into `buff`.
   A space is appended after a byte while `len` is still non-zero.  When
   `buff` is NULL a 128-byte static buffer is used, so that result is
   overwritten by the next such call.
   NOTE(review): no bound check against the buffer size is visible on these
   lines; confirm that callers keep `len` small enough. */
610 static char *hexdump(unsigned char *p, int len, char *buff) {
611 static char localbuff[128];
613 if (!buff) buff=localbuff;
616 sprintf(bytebuff,"%02x",*p);
618 strcat(buff,bytebuff);
619 if (len) strcat(buff," ");
/* isamd_pp_dump: debugging aid that logs the contents of the entry at `ipos`.
   The entry is opened with isamd_pp_open and read key by key through
   isamd_pp_read.  Whenever the handle moves to a new block, that block's
   header values and a hex dump of its buffer are logged.  Every key is
   logged with its sysno/seqno in decimal and hex, plus a hex dump of the
   bytes between the previous offset and pp->offset.
   NOTE(review): closing the handle is not on the lines shown here. */
625 void isamd_pp_dump (ISAMD is, ISAMD_P ipos)
635 logf(LOG_LOG,"dumping isamd block %d (%d:%d)",
636 (int)ipos, isamd_type(ipos), isamd_block(ipos) );
637 pp=isamd_pp_open(is,ipos);
638 logf(LOG_LOG,"numKeys=%d, ofs=%d d=%d",
640 pp->offset, pp->diffs);
642 while(isamd_pp_read(pp, &key))
/* A changed block address means the read moved on to another block. */
644 if (oldaddr != isamd_addr(pp->pos,pp->cat) )
646 oldaddr = isamd_addr(pp->pos,pp->cat);
647 logf(LOG_LOG,"block %d (%d:%d) sz=%d nx=%d (%d:%d) ofs=%d",
648 isamd_addr(pp->pos,pp->cat),
649 pp->cat, pp->pos, pp->size,
650 pp->next, isamd_type(pp->next), isamd_block(pp->next),
656 logf(LOG_LOG," %05x: %s",i,hexdump(pp->buf+i,n,hexbuff));
/* Clamp the previous offset to the later-block header length. */
659 if (oldoffs > ISAMD_BLOCK_OFFSET_N)
660 oldoffs=ISAMD_BLOCK_OFFSET_N;
663 logf (LOG_LOG," got %d:%d=%x:%x from %s at %d=%x",
664 key.sysno, key.seqno,
665 key.sysno, key.seqno,
666 hexdump(pp->buf+oldoffs, pp->offset-oldoffs, hexbuff),
668 oldoffs = pp->offset;
670 /*!*/ /*TODO: dump diffs too!!! */
676 * Revision 1.2 1999-07-14 15:05:30 heikki
677 * slow start on isam-d
679 * Revision 1.1 1999/07/14 12:34:43 heikki
680 * Copied from isamh, starting to change things...