2 * Copyright (c) 1995-1998, Index Data.
3 * See the file LICENSE for details.
6 * Isamd - isam with diffs
8 * todo: Move read_pp into merge-d
22 #include "../index/index.h" /* isamd uses the internal structure of it_key */
25 static void flush_block (ISAMD is, int cat);
26 static void release_fc (ISAMD is, int cat);
27 static void init_fc (ISAMD is, int cat);
29 #define ISAMD_FREELIST_CHUNK 1
/* isamd_getmethod: on the lines visible here it declares a static default
 * category table (def_cat), allocates a method record with xmalloc, clears
 * compare_item and sets max_blocks_mem to 10.
 * NOTE(review): the parameter me is not referenced on any visible line -
 * confirm its intended role against the full source. */
33 ISAMD_M isamd_getmethod (ISAMD_M me)
35 static struct ISAMD_filecat_s def_cat[] = {
37 /* blocksz, max keys before switching size. Unused for the time being */
50 /* old values from isamc, long time ago...
59 /* assume about 2 bytes per pointer, when compressed. The head uses */
60 /* 16 bytes, and other blocks use 8 for header info... If you want 3 */
61 /* blocks of 32 bytes, say max 16+24+24 = 64 keys */
64 ISAMD_M m = (ISAMD_M) xmalloc (sizeof(*m));
/* no comparison callback by default */
72 m->compare_item = NULL;
76 m->max_blocks_mem = 10;
/* isamd_open: builds an ISAMD handle on top of the block-file system bfs.
 *   bfs       - block file handle passed through to bf_open
 *   name      - base name; each category file is name plus one letter
 *   writeflag - NOTE(review): presumably forwarded to bf_open on a line
 *               that is not shown - confirm
 *   method    - method record; a private copy is stored in the handle
 * Visible steps: allocate the handle and the method copy, walk the
 * category table (logging it when debug is set), allocate the per-category
 * file array, open each block file, load or initialise its head, allocate
 * the freelist buffer and zero the statistics counters. */
83 ISAMD isamd_open (BFiles bfs, const char *name, int writeflag, ISAMD_M method)
86 ISAMD_filecat filecat;
89 is = (ISAMD) xmalloc (sizeof(*is));
/* keep a private copy so the caller's method record is not shared */
91 is->method = (ISAMD_M) xmalloc (sizeof(*is->method));
92 memcpy (is->method, method, sizeof(*method));
93 filecat = is->method->filecat;
96 /* determine number of block categories */
97 if (is->method->debug)
98 logf (LOG_LOG, "isamd: bsize maxkeys");
101 if (is->method->debug)
102 logf (LOG_LOG, "isamd:%6d %6d",
103 filecat[i].bsize, filecat[i].mblocks);
/* the table ends at the first entry whose mblocks is zero */
104 } while (filecat[i++].mblocks);
108 assert (is->no_files > 0);
/* NOTE(review): three bits can encode 0..7 only, so allowing the value 8
 * here looks like an off-by-one - confirm against isamd_type/isamd_addr */
109 assert (is->max_cat <=8 ); /* we have only 3 bits for it */
111 is->files = (ISAMD_file) xmalloc (sizeof(*is->files)*is->no_files);
114 /* TODO - whatever needs to be done here... */
120 for (i = 0; i<is->no_files; i++)
/* file name is the base name followed by A, B, C, ... per category.
 * NOTE(review): sprintf is unbounded and the size of fname is not visible
 * here - confirm the buffer can hold name plus two bytes */
124 sprintf (fname, "%s%c", name, i+'A');
125 is->files[i].bf = bf_open (bfs, fname, is->method->filecat[i].bsize,
127 is->files[i].head_is_dirty = 0;
/* block 0 holds the head; the two assignments below give the values used
 * for a fresh head (presumably only when this read yields nothing -
 * the braces are on lines not shown) */
128 if (!bf_read (is->files[i].bf, 0, 0, sizeof(ISAMD_head),
131 is->files[i].head.lastblock = 1;
132 is->files[i].head.freelist = 0;
134 is->files[i].alloc_entries_num = 0;
/* capacity of one freelist block in ints, minus one slot */
135 is->files[i].alloc_entries_max =
136 is->method->filecat[i].bsize / sizeof(int) - 1;
/* scratch buffer of exactly one block of this category */
137 is->files[i].alloc_buf = (char *)
138 xmalloc (is->method->filecat[i].bsize);
139 is->files[i].no_writes = 0; /* clear statistics */
140 is->files[i].no_reads = 0;
141 is->files[i].no_skip_writes = 0;
142 is->files[i].no_allocated = 0;
143 is->files[i].no_released = 0;
144 is->files[i].no_remap = 0;
145 is->files[i].no_forward = 0;
146 is->files[i].no_backward = 0;
147 is->files[i].sum_forward = 0;
148 is->files[i].sum_backward = 0;
149 is->files[i].no_next = 0;
150 is->files[i].no_prev = 0;
/* isamd_block_used: for a valid category index type, returns
 * head.lastblock-1 of that category file. The value returned for an
 * out-of-range type is on a line not shown here. */
157 int isamd_block_used (ISAMD is, int type)
159 if (type < 0 || type >= is->no_files)
161 return is->files[type].head.lastblock-1;
/* isamd_block_size: for a valid category index type, returns the bsize
 * entry of the method's category table. The value returned for an
 * out-of-range type is on a line not shown here. */
164 int isamd_block_size (ISAMD is, int type)
166 ISAMD_filecat filecat = is->method->filecat;
167 if (type < 0 || type >= is->no_files)
169 return filecat[type].bsize;
/* isamd_close: shuts down an ISAMD handle. On the visible lines it logs
 * the traversal and I/O statistics when debug is set, writes each dirty
 * head back to block 0, frees the free-cache list and closes each block
 * file.
 * NOTE(review): no visible line frees alloc_buf (allocated per category
 * in isamd_open) - confirm it is released on a line not shown. */
172 int isamd_close (ISAMD is)
176 if (is->method->debug)
178 logf (LOG_LOG, "isamd: next forw mid-f prev backw mid-b");
179 for (i = 0; i<is->no_files; i++)
180 logf (LOG_LOG, "isamd:%8d%8d%8.1f%8d%8d%8.1f",
181 is->files[i].no_next,
182 is->files[i].no_forward,
/* the ternary guards the average against a zero count */
183 is->files[i].no_forward ?
184 (double) is->files[i].sum_forward/is->files[i].no_forward
186 is->files[i].no_prev,
187 is->files[i].no_backward,
188 is->files[i].no_backward ?
189 (double) is->files[i].sum_backward/is->files[i].no_backward
192 if (is->method->debug)
193 logf (LOG_LOG, "isamd: writes reads skipped alloc released remap");
194 for (i = 0; i<is->no_files; i++)
197 assert (is->files[i].bf);
/* persist the head only if it was modified since it was loaded */
198 if (is->files[i].head_is_dirty)
199 bf_write (is->files[i].bf, 0, 0, sizeof(ISAMD_head),
201 if (is->method->debug)
202 logf (LOG_LOG, "isamd:%8d%8d%8d%8d%8d%8d",
203 is->files[i].no_writes,
204 is->files[i].no_reads,
205 is->files[i].no_skip_writes,
206 is->files[i].no_allocated,
207 is->files[i].no_released,
208 is->files[i].no_remap);
209 xfree (is->files[i].fc_list);
211 bf_close (is->files[i].bf);
/* isamd_read_block: counts the read in the category statistics and reads
 * block pos of category cat into dst. Returns whatever bf_read returns. */
219 int isamd_read_block (ISAMD is, int cat, int pos, char *dst)
221 ++(is->files[cat].no_reads);
222 return bf_read (is->files[cat].bf, pos, 0, 0, dst);
/* isamd_write_block: counts the write in the category statistics, logs it
 * when debug is above 2, and writes src to block pos of category cat.
 * Returns whatever bf_write returns. */
225 int isamd_write_block (ISAMD is, int cat, int pos, char *src)
227 ++(is->files[cat].no_writes);
228 if (is->method->debug > 2)
229 logf (LOG_LOG, "isamd: write_block %d %d", cat, pos);
230 return bf_write (is->files[cat].bf, pos, 0, 0, src);
/* isamd_write_dblock: writes a data block with its two-field header.
 * src points at the payload; the header (nextpos, then size) is stored in
 * the ISAMD_BLOCK_OFFSET_N bytes immediately before it, and the block is
 * then written starting from that header.
 * The stored size is offset plus ISAMD_BLOCK_OFFSET_N.
 * NOTE(review): the caller must own ISAMD_BLOCK_OFFSET_N writable bytes in
 * front of src - confirm at every call site. */
233 int isamd_write_dblock (ISAMD is, int cat, int pos, char *src,
234 int nextpos, int offset)
236 ISAMD_BLOCK_SIZE size = offset + ISAMD_BLOCK_OFFSET_N;
237 if (is->method->debug > 2)
238 logf (LOG_LOG, "isamd: write_dblock. size=%d nextpos=%d",
239 (int) size, nextpos);
/* step back so that src addresses the start of the header */
240 src -= ISAMD_BLOCK_OFFSET_N;
241 assert( ISAMD_BLOCK_OFFSET_N == sizeof(int)+sizeof(int) );
242 memcpy (src, &nextpos, sizeof(int));
/* NOTE(review): copies sizeof(size) bytes while the assert above assumes
 * an int-sized slot - confirm ISAMD_BLOCK_SIZE is the width of int */
243 memcpy (src + sizeof(int), &size, sizeof(size));
244 return isamd_write_block (is, cat, pos, src);
247 #if ISAMD_FREELIST_CHUNK
/* flush_block (chunked freelist variant): if the category has a freelist
 * head block and buffered entries, stores the entry count in the first int
 * of the buffer, writes the buffer to the freelist head block and resets
 * the buffered count to zero. */
248 static void flush_block (ISAMD is, int cat)
250 char *abuf = is->files[cat].alloc_buf;
251 int block = is->files[cat].head.freelist;
252 if (block && is->files[cat].alloc_entries_num)
254 memcpy (abuf, &is->files[cat].alloc_entries_num, sizeof(int));
255 bf_write (is->files[cat].bf, block, 0, 0, abuf);
256 is->files[cat].alloc_entries_num = 0;
/* alloc_block (chunked freelist variant): hands out one block number for
 * category cat and counts the allocation.
 * Buffer layout as used by the visible lines: int 0 is the entry count,
 * int 1 is the next freelist block, and entry k lives at byte offset
 * sizeof(int) + k*sizeof(int).
 * Without a freelist the file is extended via head.lastblock; otherwise
 * an entry is taken from the buffered freelist block. The conditions that
 * select between these paths are partly on lines not shown. */
261 static int alloc_block (ISAMD is, int cat)
263 int block = is->files[cat].head.freelist;
264 char *abuf = is->files[cat].alloc_buf;
266 (is->files[cat].no_allocated)++;
270 block = (is->files[cat].head.lastblock)++; /* no free list */
271 is->files[cat].head_is_dirty = 1;
275 if (!is->files[cat].alloc_entries_num) /* read first time */
/* load the freelist head block and pick up its entry count */
277 bf_read (is->files[cat].bf, block, 0, 0, abuf);
278 memcpy (&is->files[cat].alloc_entries_num, abuf,
279 sizeof(is->files[cat].alloc_entries_num));
280 assert (is->files[cat].alloc_entries_num > 0);
282 /* have some free blocks now */
283 assert (is->files[cat].alloc_entries_num > 0);
284 is->files[cat].alloc_entries_num--;
285 if (!is->files[cat].alloc_entries_num) /* last one in block? */
/* the chunk is exhausted: advance the head to the next freelist block
 * stored in the second int of the buffer */
287 memcpy (&is->files[cat].head.freelist, abuf + sizeof(int),
289 is->files[cat].head_is_dirty = 1;
291 if (is->files[cat].head.freelist)
293 bf_read (is->files[cat].bf, is->files[cat].head.freelist,
295 memcpy (&is->files[cat].alloc_entries_num, abuf,
296 sizeof(is->files[cat].alloc_entries_num));
297 assert (is->files[cat].alloc_entries_num);
/* take the entry indexed by the already decremented count */
301 memcpy (&block, abuf + sizeof(int) + sizeof(int) *
302 is->files[cat].alloc_entries_num, sizeof(int));
/* release_block (chunked freelist variant): returns block pos of category
 * cat to the freelist and counts the release.
 * If the buffer is empty but a freelist head exists, the head block is
 * loaded first. A full buffer is written out and restarted. When the
 * buffer is (re)started, pos itself becomes the new freelist head and the
 * previous head is stored as its next pointer; otherwise an entry is
 * stored in the slot indexed by the current count. */
307 static void release_block (ISAMD is, int cat, int pos)
309 char *abuf = is->files[cat].alloc_buf;
310 int block = is->files[cat].head.freelist;
312 (is->files[cat].no_released)++;
314 if (block && !is->files[cat].alloc_entries_num) /* must read block */
316 bf_read (is->files[cat].bf, block, 0, 0, abuf);
317 memcpy (&is->files[cat].alloc_entries_num, abuf,
318 sizeof(is->files[cat].alloc_entries_num));
319 assert (is->files[cat].alloc_entries_num > 0);
321 assert (is->files[cat].alloc_entries_num <= is->files[cat].alloc_entries_max);
322 if (is->files[cat].alloc_entries_num == is->files[cat].alloc_entries_max)
/* buffer is full: store the count in int 0, write it out, start afresh */
325 memcpy (abuf, &is->files[cat].alloc_entries_num, sizeof(int));
326 bf_write (is->files[cat].bf, block, 0, 0, abuf);
327 is->files[cat].alloc_entries_num = 0;
329 if (!is->files[cat].alloc_entries_num) /* make new buffer? */
/* chain the old head behind the released block, which becomes the head */
331 memcpy (abuf + sizeof(int), &block, sizeof(int));
332 is->files[cat].head.freelist = pos;
333 is->files[cat].head_is_dirty = 1;
337 memcpy (abuf + sizeof(int) +
338 is->files[cat].alloc_entries_num*sizeof(int),
341 is->files[cat].alloc_entries_num++;
/* flush_block (variant used when ISAMD_FREELIST_CHUNK is off): only the
 * buffer lookup is visible in this listing; the rest of the body, if any,
 * is on lines not shown. */
344 static void flush_block (ISAMD is, int cat)
346 char *abuf = is->files[cat].alloc_buf;
/* alloc_block (simple linked freelist variant): marks the head dirty and
 * counts the allocation. If a freelist head exists, that block is taken
 * and the head advances to the int stored at the start of it; the
 * lastblock increment extends the file instead (presumably the else
 * branch - the branch keyword is on a line not shown). */
350 static int alloc_block (ISAMD is, int cat)
353 char buf[sizeof(int)];
355 is->files[cat].head_is_dirty = 1;
356 (is->files[cat].no_allocated)++;
357 if ((block = is->files[cat].head.freelist))
/* first int of a free block is the number of the next free block */
359 bf_read (is->files[cat].bf, block, 0, sizeof(int), buf);
360 memcpy (&is->files[cat].head.freelist, buf, sizeof(int));
363 block = (is->files[cat].head.lastblock)++;
/* release_block (simple linked freelist variant): pushes block pos onto
 * the freelist of category cat. The old head number is written into the
 * first int of the released block, which then becomes the new head. */
367 static void release_block (ISAMD is, int cat, int pos)
369 char buf[sizeof(int)];
371 (is->files[cat].no_released)++;
372 is->files[cat].head_is_dirty = 1;
373 memcpy (buf, &is->files[cat].head.freelist, sizeof(int));
374 is->files[cat].head.freelist = pos;
375 bf_write (is->files[cat].bf, pos, 0, sizeof(int), buf);
/* isamd_alloc_block: public allocator for category cat. When a free cache
 * (fc_list) exists it is scanned for a nonzero entry, accepted when no
 * block has been chosen yet or when it is lower than the current choice,
 * and the slot is cleared. alloc_block supplies a block from the file
 * (presumably only when the cache gave none - that condition is on a line
 * not shown). The result is logged when debug is above 3. */
379 int isamd_alloc_block (ISAMD is, int cat)
383 if (is->files[cat].fc_list)
386 for (j = 0; j < is->files[cat].fc_max; j++)
387 if ((nb = is->files[cat].fc_list[j]) && (!block || nb < block))
389 is->files[cat].fc_list[j] = 0;
395 block = alloc_block (is, cat);
396 if (is->method->debug > 3)
397 logf (LOG_LOG, "isamd: alloc_block in cat %d: %d", cat, block);
/* isamd_release_block: public release for block pos of category cat.
 * Logs when debug is above 3. When a free cache exists, pos is parked in
 * the first empty (zero) slot; release_block hands it to the on-disk
 * freelist (presumably only when no slot was free - the early exit is on
 * a line not shown). */
401 void isamd_release_block (ISAMD is, int cat, int pos)
403 if (is->method->debug > 3)
404 logf (LOG_LOG, "isamd: release_block in cat %d: %d", cat, pos);
407 if (is->files[cat].fc_list)
410 for (j = 0; j<is->files[cat].fc_max; j++)
411 if (!is->files[cat].fc_list[j])
413 is->files[cat].fc_list[j] = pos;
417 release_block (is, cat, pos);
/* init_fc: sets up the free cache of category cat with j slots and zeroes
 * slots. The initial value of j and the loop around the clearing store are
 * on lines not shown.
 * NOTE(review): the clearing store must run with j below fc_max - confirm
 * the loop decrements j before indexing. */
420 static void init_fc (ISAMD is, int cat)
424 is->files[cat].fc_max = j;
425 is->files[cat].fc_list = (int *)
426 xmalloc (sizeof(*is->files[0].fc_list) * j);
428 is->files[cat].fc_list[j] = 0;
/* release_fc: drains the free cache of category cat. Every nonzero cached
 * block number is passed to release_block and its slot is cleared. The
 * loop header that steps j down from fc_max is on a line not shown. */
431 static void release_fc (ISAMD is, int cat)
433 int b, j = is->files[cat].fc_max;
436 if ((b = is->files[cat].fc_list[j]))
438 release_block (is, cat, b);
439 is->files[cat].fc_list[j] = 0;
/* isamd_pp_close: tears down a position pointer. The visible lines stop
 * the decoder through the method's code_stop callback and free the diff
 * data; release of pp and its buffer is not visible in this listing. */
443 void isamd_pp_close (ISAMD_PP pp)
447 (*is->method->code_stop)(ISAMD_DECODE, pp->decodeClientData);
448 isamd_free_diffs(pp); /* see merge-d.h */
/* isamd_pp_open: creates a position pointer for the list at address ipos.
 * The address is split into category and block number, a zeroed buffer of
 * the largest block size is allocated, a decoder is started, and the first
 * block is read. Its header is unpacked in the order next, size, numKeys,
 * diffs, after which offset must equal ISAMD_BLOCK_OFFSET_1. */
455 ISAMD_PP isamd_pp_open (ISAMD is, ISAMD_P ipos)
457 ISAMD_PP pp = (ISAMD_PP) xmalloc (sizeof(*pp));
460 pp->cat = isamd_type(ipos);
461 pp->pos = isamd_block(ipos);
463 src = pp->buf = (char *) xmalloc (is->method->filecat[is->max_cat].bsize);
464 /* always allocate for the largest blocks, saves trouble */
465 memset(pp->buf,'\0',is->method->filecat[is->max_cat].bsize);
470 pp->decodeClientData = (*is->method->code_start)(ISAMD_DECODE);
471 //pp->deleteFlag = 0;
481 isamd_read_block (is, pp->cat, pp->pos, src);
/* unpack the first-block header field by field, advancing src */
482 memcpy (&pp->next, src, sizeof(pp->next));
483 src += sizeof(pp->next);
484 memcpy (&pp->size, src, sizeof(pp->size));
485 src += sizeof(pp->size);
486 memcpy (&pp->numKeys, src, sizeof(pp->numKeys));
487 src += sizeof(pp->numKeys);
488 memcpy (&pp->diffs, src, sizeof(pp->diffs));
489 src += sizeof(pp->diffs);
/* NOTE(review): this compares next with the bare block number, whereas
 * isamd_buildlaterblock compares it with isamd_addr(pos,cat) - confirm
 * which form is intended */
490 assert (pp->next != pp->pos);
491 pp->offset = src - pp->buf;
492 assert (pp->offset == ISAMD_BLOCK_OFFSET_1);
493 if (is->method->debug > 2)
494 logf (LOG_LOG, "isamd_pp_open sz=%d c=%d p=%d n=%d",
495 pp->size, pp->cat, pp->pos, isamd_block(pp->next));
/* isamd_buildfirstblock: serialises the first-block header of pp through
 * dst in the order next, size, numKeys, diffs, and checks that exactly
 * ISAMD_BLOCK_OFFSET_1 bytes were produced relative to pp->buf. Logs the
 * header when debug is above 1. The declaration of dst is on a line not
 * shown. */
503 void isamd_buildfirstblock(ISAMD_PP pp){
506 assert(pp->next != pp->pos);
507 memcpy(dst, &pp->next, sizeof(pp->next) );
508 dst += sizeof(pp->next);
509 memcpy(dst, &pp->size,sizeof(pp->size));
510 dst += sizeof(pp->size);
511 memcpy(dst, &pp->numKeys, sizeof(pp->numKeys));
512 dst += sizeof(pp->numKeys);
513 memcpy(dst, &pp->diffs, sizeof(pp->diffs));
514 dst += sizeof(pp->diffs);
515 assert (dst - pp->buf == ISAMD_BLOCK_OFFSET_1);
516 if (pp->is->method->debug > 1) //!!! 2
517 logf (LOG_LOG, "isamd: 1st: sz=%d p=%d:%d>%d:%d nk=%d d=%d=2*%d+%d",
520 isamd_type(pp->next), isamd_block(pp->next),
/* the log shows diffs split into its half and its lowest bit */
522 pp->diffs, pp->diffs/2, pp->diffs&1);
/* isamd_buildlaterblock: serialises the header of a non-first block of pp
 * through dst in the order next, size, and checks that exactly
 * ISAMD_BLOCK_OFFSET_N bytes were produced relative to pp->buf. Logs the
 * header when debug is above 1. The declaration of dst is on a line not
 * shown. */
525 void isamd_buildlaterblock(ISAMD_PP pp){
/* a block must never point at itself */
528 assert(pp->next != isamd_addr(pp->pos,pp->cat));
529 memcpy(dst, &pp->next, sizeof(pp->next) );
530 dst += sizeof(pp->next);
531 memcpy(dst, &pp->size,sizeof(pp->size));
532 dst += sizeof(pp->size);
533 assert (dst - pp->buf == ISAMD_BLOCK_OFFSET_N);
534 if (pp->is->method->debug > 1) //!!! 2
535 logf (LOG_LOG, "isamd: l8r: sz=%d p=%d/%d>%d/%d",
538 isamd_block(pp->next), isamd_type(pp->next) );
543 /* returns non-zero if item could be read; 0 otherwise */
/* Thin wrapper: passes the address of the local copy of buf to
 * isamd_read_item, so any pointer advance made there is not seen by the
 * caller. */
544 int isamd_pp_read (ISAMD_PP pp, void *buf)
546 return isamd_read_item (pp, (char **) &buf);
547 /* note: isamd_read_item is in merge-d.c, because it is so */
548 /* convoluted with the merge process */
// isamd_read_main_item: decodes the next main-list item of pp into the
// location addressed by dst, moving on to the following block when the
// current one is exhausted. The comment below is the original header; its
// closing line is missing from this listing.
551 /* read one main item from file - decode and store it in *dst.
552 Does not worry about diffs
555 1 if item could be read ok
557 int isamd_read_main_item (ISAMD_PP pp, char **dst)
560 char *src = pp->buf + pp->offset;
563 if (pp->offset >= pp->size)
568 return 0; /* end of file */
// statistics: classify the jump to the next block as adjacent (next/prev)
// or as a longer forward/backward move, accumulating the distance
570 if (pp->next > pp->pos)
572 if (pp->next == pp->pos + 1)
573 is->files[pp->cat].no_next++;
576 is->files[pp->cat].no_forward++;
577 is->files[pp->cat].sum_forward += pp->next - pp->pos;
582 if (pp->next + 1 == pp->pos)
583 is->files[pp->cat].no_prev++;
586 is->files[pp->cat].no_backward++;
587 is->files[pp->cat].sum_backward += pp->pos - pp->next;
590 /* out new block position */
// NOTE(review): newcat is assigned here but not used on any visible line
591 newcat = isamd_type(pp->next);
592 pp->pos = isamd_block(pp->next);
593 pp->cat = isamd_type(pp->next);
596 /* read block and save 'next' and 'size' entry */
597 isamd_read_block (is, pp->cat, pp->pos, src);
598 memcpy (&pp->next, src, sizeof(pp->next));
599 src += sizeof(pp->next);
600 memcpy (&pp->size, src, sizeof(pp->size));
601 src += sizeof(pp->size);
602 /* assume block is non-empty */
603 assert (src - pp->buf == ISAMD_BLOCK_OFFSET_N);
604 assert (pp->next != isamd_addr(pp->pos,pp->cat));
605 //if (pp->deleteFlag)
606 // isamd_release_block (is, pp->cat, pp->pos);
// a fresh block starts a fresh decoder state before the first item
607 (*is->method->code_reset)(pp->decodeClientData);
608 (*is->method->code_item)(ISAMD_DECODE, pp->decodeClientData, dst, &src);
609 pp->offset = src - pp->buf;
610 if (is->method->debug > 2)
611 logf (LOG_LOG, "isamd: read_block size=%d %d %d next=%d",
612 pp->size, pp->cat, pp->pos, pp->next);
// item decoded from the block already in the buffer
615 (*is->method->code_item)(ISAMD_DECODE, pp->decodeClientData, dst, &src);
616 pp->offset = src - pp->buf;
/* NOTE(review): only the signature is visible in this listing; presumably
 * this reports the number of keys held for pp - confirm against the body. */
620 int isamd_pp_num (ISAMD_PP pp)
/* hexdump: formats len bytes starting at p as two-digit hex values
 * separated by single spaces. Output goes to buff, or to a 128-byte
 * static buffer when buff is NULL, so the NULL form is not reentrant.
 * NOTE(review): the strcat calls are unbounded; three characters are used
 * per byte, so the static buffer holds about 42 bytes of input - confirm
 * that callers respect this. */
625 static char *hexdump(unsigned char *p, int len, char *buff) {
626 static char localbuff[128];
628 if (!buff) buff=localbuff;
631 sprintf(bytebuff,"%02x",*p);
633 strcat(buff,bytebuff);
/* separator only between bytes, not after the last one */
634 if (len) strcat(buff," ");
/* isamd_pp_dump: debugging aid that logs the contents of the list at
 * address ipos. It opens a position pointer, logs the header values, then
 * reads keys one by one; whenever the pointer has moved to a new block it
 * logs that block header and a hex dump, and for every key it logs sysno,
 * seqno and the raw bytes the key was decoded from. Diffs are not dumped
 * (see the TODO at the end). */
640 void isamd_pp_dump (ISAMD is, ISAMD_P ipos)
650 logf(LOG_LOG,"dumping isamd block %d (%d:%d)",
651 (int)ipos, isamd_type(ipos), isamd_block(ipos) );
652 pp=isamd_pp_open(is,ipos);
653 logf(LOG_LOG,"numKeys=%d, ofs=%d d=%d",
655 pp->offset, pp->diffs);
657 while(isamd_pp_read(pp, &key))
/* address change means the reader crossed into another block */
659 if (oldaddr != isamd_addr(pp->pos,pp->cat) )
661 oldaddr = isamd_addr(pp->pos,pp->cat);
662 logf(LOG_LOG,"block %d (%d:%d) sz=%d nx=%d (%d:%d) ofs=%d",
663 isamd_addr(pp->pos,pp->cat),
664 pp->cat, pp->pos, pp->size,
665 pp->next, isamd_type(pp->next), isamd_block(pp->next),
/* NOTE(review): pp->buf is assigned from a char pointer in isamd_pp_open
 * while hexdump takes unsigned char pointer - confirm the conversion */
671 logf(LOG_LOG," %05x: %s",i,hexdump(pp->buf+i,n,hexbuff));
674 if (oldoffs > ISAMD_BLOCK_OFFSET_N)
675 oldoffs=ISAMD_BLOCK_OFFSET_N;
678 logf (LOG_LOG," got %d:%d=%x:%x from %s at %d=%x",
679 key.sysno, key.seqno,
680 key.sysno, key.seqno,
/* bytes consumed by this key: from the previous offset to the current */
681 hexdump(pp->buf+oldoffs, pp->offset-oldoffs, hexbuff),
683 oldoffs = pp->offset;
685 /*!*/ /*TODO: dump diffs too!!! */
691 * Revision 1.5 1999-08-07 11:30:59 heikki
692 * Bug fixing (still a mem leak somewhere)
694 * Revision 1.4 1999/08/04 14:21:18 heikki
695 * isam-d seems to be working.
697 * Revision 1.3 1999/07/21 14:24:50 heikki
698 * isamd write and read functions ok, except when diff block full.
699 * (merge not yet done)
701 * Revision 1.1 1999/07/14 12:34:43 heikki
702 * Copied from isamh, starting to change things...