2 * Copyright (C) 1994-1995, Index Data I/S
4 * Sebastian Hammer, Adam Dickmeiss
7 * Revision 1.6 1995-09-08 14:52:27 adam
8 * Minor changes. Dictionary is lower case now.
10 * Revision 1.5 1995/09/06 16:11:16 adam
11 * Option: only one word key per file.
13 * Revision 1.4 1995/09/05 15:28:39 adam
14 * More work on search engine.
16 * Revision 1.3 1995/09/04 12:33:41 adam
17 * Various cleanup. YAZ util used instead.
19 * Revision 1.2 1995/09/04 09:10:34 adam
20 * More work on index add/del/update.
21 * Merge sort implemented.
22 * Initial work on z39 server.
24 * Revision 1.1 1995/09/01 14:06:35 adam
25 * Split of work into more files.
/* Number of bytes key_open requests from malloc for key_buf; key_write
   also compares the running offset against it. */
37 #define KEY_BUF_SIZE 100000
/* Next system number to assign: loaded from the "." dictionary entry in
   key_open and post-incremented in file_extract. */
40 static SYSNO sysno_next;
/* Descriptor of the key file opened by key_open; starts out as -1. */
41 static int key_fd = -1;
/* Descriptor of FNAME_SYS_IDX opened by key_open; starts out as -1. */
42 static int sys_idx_fd = -1;
/* Count of bytes currently stored in key_buf; advanced by key_write. */
44 static int key_offset;
/*
 * key_open: set up the module's files and buffer.
 *   fname - path of the key file to open.
 * Opens the key file, allocates key_buf, opens the file dictionary, reads
 * sysno_next from the dictionary's "." entry and opens FNAME_SYS_IDX.
 * Each failure is reported through logf; the statement that follows each
 * log call is not visible in this view.
 */
46 void key_open (const char *fname)
/* Read/write access, created if missing (mode argument 0666). */
51 if ((key_fd = open (fname, O_RDWR|O_CREAT, 0666)) == -1)
53 logf (LOG_FATAL|LOG_ERRNO, "open %s", fname);
56 logf (LOG_DEBUG, "key_open of %s", fname);
57 if (!(key_buf = malloc (KEY_BUF_SIZE)))
59 logf (LOG_FATAL|LOG_ERRNO, "malloc");
/* The meaning of the arguments 40 and 1 is defined by dict_open, which is
   not visible here -- TODO confirm. */
63 if (!(file_idx = dict_open (FNAME_FILE_DICT, 40, 1)))
/* NOTE(review): the message prints the literal "fileidx" while the call
   above opens FNAME_FILE_DICT; confirm the two agree. */
65 logf (LOG_FATAL, "dict_open fail of %s", "fileidx");
/* The "." entry carries the persisted sysno_next. */
68 file_key = dict_lookup (file_idx, ".");
/* The copy skips the first byte of the entry (presumably a length byte --
   TODO confirm).  NOTE(review): any check that file_key is non-NULL would
   be on a line not visible here. */
70 memcpy (&sysno_next, (char*)file_key+1, sizeof(sysno_next));
73 if ((sys_idx_fd = open (FNAME_SYS_IDX, O_RDWR|O_CREAT, 0666)) == -1)
75 logf (LOG_FATAL|LOG_ERRNO, "open %s", FNAME_SYS_IDX);
/* Fragment of a routine whose header is not visible in this view; the log
   text suggests it is key_close -- TODO confirm.  The condition selecting
   between the two debug messages is likewise not visible. */
84 logf (LOG_DEBUG, "key_close - but no file");
/* Store the current sysno_next under the "." key (the key that key_open
   looks up), then close the dictionary. */
89 dict_insert (file_idx, ".", sizeof(sysno_next), &sysno_next);
90 dict_close (file_idx);
92 logf (LOG_DEBUG, "key close - key file exist");
/* Fragment of a routine whose header is not visible in this view.  Writes
   the bytes of key_buf from offset i up to key_offset to key_fd, calling
   write again while i is below key_offset.  The test on w that leads to
   the fatal log and the update of i are on lines not visible here
   (presumably i advances by w -- TODO confirm). */
103 while (i < key_offset)
105 w = write (key_fd, key_buf + i, key_offset - i);
108 logf (LOG_FATAL|LOG_ERRNO, "Write key fail");
/*
 * key_write: append one record to key_buf at key_offset.
 *   cmd - command character; 'a' is stored as 1, anything else as 0.
 *   k   - key structure copied into the buffer as raw bytes.
 *   str - NUL-terminated word copied into the buffer with its terminator.
 * Record layout per the visible copies: str bytes plus NUL, the one-byte
 * flag x, then sizeof(*k) bytes of *k.
 */
116 void key_write (int cmd, struct it_key *k, const char *str)
119 size_t slen = strlen(str);
/* Room check against KEY_BUF_SIZE; the action taken when the record does
   not fit is on a line not visible here (presumably the buffer is written
   out first -- TODO confirm). */
121 if (key_offset + sizeof(*k) + slen >= KEY_BUF_SIZE - 2)
123 x = (cmd == 'a') ? 1 : 0;
124 memcpy (key_buf + key_offset, str, slen+1);
125 key_offset += slen+1;
/* One byte of x is stored.  NOTE(review): the advance of key_offset past
   this byte is not visible here; without it the copy of *k below would
   overwrite x -- TODO confirm. */
126 memcpy (key_buf + key_offset, &x, 1);
128 memcpy (key_buf + key_offset, k, sizeof(*k));
129 key_offset += sizeof(*k);
/*
 * key_write_x: record one occurrence of word `str' in string table `t'.
 *   t   - string table queried through strtab_src.
 *   cmd - not used on any line visible here.
 *   k   - key copied into the table entry on the allocation path below.
 *   str - the word to look up.
 * When strtab_src returns non-zero, the seqno of the it_key behind
 * *oldinfo is incremented.  The remaining lines allocate a copy of *k and
 * set its seqno to 1; the branch keyword joining the two paths is not
 * visible here (presumably an else -- TODO confirm).
 */
132 void key_write_x (struct strtab *t, int cmd, struct it_key *k, const char *str)
136 if (strtab_src (t, str, &oldinfo))
137 ((struct it_key *) *oldinfo)->seqno++;
/* Allocation path: the entry's info pointer receives a private copy of *k
   whose seqno is then set to 1. */
140 *oldinfo = xmalloc (sizeof(*k));
141 memcpy (*oldinfo, k, sizeof(*k));
142 ((struct it_key *) *oldinfo)->seqno = 1;
/*
 * key_rec_flush: adapter that forwards one string-table entry to key_write.
 *   str  - the entry's word.
 *   info - the entry's payload, treated as a struct it_key.
 *   data - pointer to an int holding the command; file_extract passes
 *          &cmd when handing this function to strtab_del.
 */
146 void key_rec_flush (const char *str, void *info, void *data)
148 key_write (*((int*) data), (struct it_key *)info, str);
/*
 * text_extract: read file `fname' character by character, collect runs of
 * alphanumeric characters as words and pass each to key_write_x.
 *   t     - string table handed on to key_write_x.
 *   sysno - system number of the file (logged; any use in building the key
 *           k is on lines not visible here).
 *   cmd   - command handed on to key_write_x.
 *   fname - path of the file to read.
 */
152 void text_extract (struct strtab *t, SYSNO sysno, int cmd, const char *fname)
/* NOTE(review): sysno is printed with %d; the definition of SYSNO is not
   visible here -- confirm it is int-compatible. */
160 logf (LOG_DEBUG, "Text extract of %d", sysno);
162 inf = fopen (fname, "r");
/* Logged as a warning; the guarding test on inf and what follows the log
   call are not visible here. */
165 logf (LOG_WARN|LOG_ERRNO, "open %s", fname);
168 while ((c=getc (inf)) != EOF)
/* Collect at most 254 alphanumeric characters into w.  The size of w, the
   read of the next character and the termination of w are on lines not
   visible here. */
171 while (i < 254 && c != EOF && isalnum(c))
/* Each character passes through index_char_cvt before being stored. */
173 w[i++] = index_char_cvt (c);
/* Conditional section: its contents and the matching #endif are not
   visible in this view. */
181 #if IT_KEY_HAVE_FIELD
184 key_write_x (t, cmd, &k, w);
/*
 * file_extract: determine the type of `fname' from its extension, map
 * `kname' to a system number, run the extractor for the type and hand the
 * collected string-table entries to key_rec_flush.
 *   cmd   - command character, logged and passed on to the extractor and
 *           (by address) to strtab_del.
 *   fname - path of the file to extract from.
 *   kname - name used as the key in the file dictionary.
 */
192 void file_extract (int cmd, const char *fname, const char *kname)
198 const char *file_type;
202 logf (LOG_DEBUG, "%c %s k=%s", cmd, fname, kname);
/* Scan fname backwards from its last character.  The loop test --i >= 0
   needs i to be a signed type; its declaration is not visible here. */
203 for (i = strlen(fname); --i >= 0; )
/* An earlier test in this if/else chain is on a line not visible here. */
209 else if (fname[i] == '.')
/* NOTE(review): unbounded copy of the text after the '.'; the size of ext
   is not visible here -- confirm it cannot overflow. */
211 strcpy (ext, fname+i+1);
/* Build the resource name "fileExtension.<ext>".  NOTE(review): unbounded
   sprintf; the size of ext_res is not visible here. */
214 sprintf (ext_res, "fileExtension.%s", ext);
/* What happens when no resource is found is on a line not visible here. */
215 if (!(file_type = res_get (common_resource, ext_res)))
218 file_info = dict_lookup (file_idx, kname);
/* New-file path (the test on file_info is not visible): take the next
   system number, record it in the dictionary under kname, and store kname
   including its NUL at offset sysno * SYS_IDX_ENTRY_LEN in the system
   index file.  NOTE(review): the results of lseek and write are not used
   on these lines. */
221 sysno = sysno_next++;
222 dict_insert (file_idx, kname, sizeof(sysno), &sysno);
223 lseek (sys_idx_fd, sysno * SYS_IDX_ENTRY_LEN, SEEK_SET);
224 write (sys_idx_fd, kname, strlen(kname)+1);
/* Existing-entry path: read sysno from the dictionary entry, skipping its
   first byte (presumably a length byte -- TODO confirm). */
227 memcpy (&sysno, (char*) file_info+1, sizeof(sysno));
/* "text" is the only file type handled on the lines visible here. */
229 if (!strcmp (file_type, "text"))
230 text_extract (t, sysno, cmd, fname);
/* Pass key_rec_flush and &cmd to strtab_del (presumably invoked once per
   table entry while the table is released -- TODO confirm). */
231 strtab_del (t, key_rec_flush, &cmd);