/*
- * $Id: reclists.c,v 1.2 2007-01-05 20:33:05 adam Exp $
+ * $Id: reclists.c,v 1.7 2007-01-15 04:34:28 quinn Exp $
*/
#include <assert.h>
+#if HAVE_CONFIG_H
+#include <cconfig.h>
+#endif
+
#include <yaz/yaz-util.h>
#include "pazpar2.h"
#include "reclists.h"
+extern struct parameters global_parameters;
+
+// Not threadsafe
+static struct reclist_sortparms *sortparms = 0;
+
struct reclist_bucket
{
- struct record *record;
+ struct record_cluster *record;
struct reclist_bucket *next;
};
-struct record *reclist_read_record(struct reclist *l)
+struct reclist_sortparms *reclist_parse_sortparms(NMEM nmem, const char *parms)
+{
+ struct reclist_sortparms *res = 0;
+ struct reclist_sortparms **rp = &res;
+ struct conf_service *service = config->servers->service;
+
+ if (strlen(parms) > 256)
+ return 0;
+ while (*parms)
+ {
+ char parm[256];
+ char *pp;
+ const char *cpp;
+ int increasing;
+ int i;
+ int offset;
+ enum conf_sortkey_type type;
+ struct reclist_sortparms *new;
+
+ if (!(cpp = strchr(parms, ',')))
+ cpp = parms + strlen(parms);
+ strncpy(parm, parms, cpp - parms);
+ parm[cpp-parms] = '\0';
+
+ if ((pp = strchr(parm, ':')))
+ {
+ increasing = pp[1] == '1' ? 1 : 0;
+ *pp = '\0';
+ }
+ else
+ increasing = 0;
+ if (!strcmp(parm, "relevance"))
+ {
+ type = Metadata_sortkey_relevance;
+ offset = -1;
+ }
+ else
+ {
+ for (i = 0; i < service->num_sortkeys; i++)
+ {
+ struct conf_sortkey *sk = &service->sortkeys[i];
+ if (!strcmp(sk->name, parm))
+ {
+ type = sk->type;
+ if (type == Metadata_sortkey_skiparticle)
+ type = Metadata_sortkey_string;
+ break;
+ }
+ }
+ if (i >= service->num_sortkeys)
+ {
+ yaz_log(YLOG_FATAL, "Bad sortkey: %s", parm);
+ return 0;
+ }
+ else
+ offset = i;
+ }
+ new = *rp = nmem_malloc(nmem, sizeof(struct reclist_sortparms));
+ new->next = 0;
+ new->offset = offset;
+ new->type = type;
+ new->increasing = increasing;
+ rp = &new->next;
+ if (*(parms = cpp))
+ parms++;
+ }
+ return res;
+}
+
+static int reclist_cmp(const void *p1, const void *p2)
+{
+ struct record_cluster *r1 = (*(struct record_cluster**) p1);
+ struct record_cluster *r2 = (*(struct record_cluster**) p2);
+ struct reclist_sortparms *s;
+
+ for (s = sortparms; s; s = s->next)
+ {
+ int res;
+ switch (s->type)
+ {
+ case Metadata_sortkey_relevance:
+ res = r2->relevance - r1->relevance;
+ break;
+ case Metadata_sortkey_string:
+ res = strcmp(r2->sortkeys[s->offset]->text, r1->sortkeys[s->offset]->text);
+ break;
+ case Metadata_sortkey_numeric:
+ res = 0;
+ break;
+ default:
+ yaz_log(YLOG_FATAL, "Bad sort type: %d", s->type);
+ exit(1);
+ }
+ if (res)
+ {
+ if (s->increasing)
+ res *= -1;
+ return res;
+ }
+ }
+ return 0;
+}
+
+void reclist_sort(struct reclist *l, struct reclist_sortparms *parms)
+{
+ sortparms = parms;
+ qsort(l->flatlist, l->num_records, sizeof(struct record_cluster*), reclist_cmp);
+ reclist_rewind(l);
+}
+
+struct record_cluster *reclist_read_record(struct reclist *l)
{
if (l->pointer < l->num_records)
return l->flatlist[l->pointer++];
hashsize <<= 1;
res = nmem_malloc(nmem, sizeof(struct reclist));
res->hashtable = nmem_malloc(nmem, hashsize * sizeof(struct reclist_bucket*));
- bzero(res->hashtable, hashsize * sizeof(struct reclist_bucket*));
+ memset(res->hashtable, 0, hashsize * sizeof(struct reclist_bucket*));
res->hashtable_size = hashsize;
res->nmem = nmem;
res->hashmask = hashsize - 1; // Creates a bitmask
res->num_records = 0;
- res->flatlist = nmem_malloc(nmem, numrecs * sizeof(struct record*));
+ res->flatlist = nmem_malloc(nmem, numrecs * sizeof(struct record_cluster*));
res->flatlist_size = numrecs;
return res;
}
-struct record *reclist_insert(struct reclist *l, struct record *record)
+// Insert a record. Return record cluster (newly formed or pre-existing)
+struct record_cluster *reclist_insert(struct reclist *l, struct record *record,
+ char *merge_key, int *total)
{
unsigned int bucket;
struct reclist_bucket **p;
- struct record *head = 0;
+ struct record_cluster *cluster = 0;
+ struct conf_service *service = global_parameters.server->service;
- bucket = hash((unsigned char*) record->merge_key) & l->hashmask;
+ bucket = hash((unsigned char*) merge_key) & l->hashmask;
for (p = &l->hashtable[bucket]; *p; p = &(*p)->next)
{
// We found a matching record. Merge them
- if (!strcmp(record->merge_key, (*p)->record->merge_key))
+ if (!strcmp(merge_key, (*p)->record->merge_key))
{
- struct record *existing = (*p)->record;
- record->next_cluster = existing->next_cluster;
- existing->next_cluster = record;
- head = existing;
+ struct record_cluster *existing = (*p)->record;
+ record->next = existing->records;
+ existing->records = record;
+ cluster = existing;
break;
}
}
- if (!head && l->num_records < l->flatlist_size)
+ if (!cluster && l->num_records < l->flatlist_size)
{
struct reclist_bucket *new =
nmem_malloc(l->nmem, sizeof(struct reclist_bucket));
+ struct record_cluster *newc =
+ nmem_malloc(l->nmem, sizeof(struct record_cluster));
- assert(!*p);
-
- new->record = record;
- record->next_cluster = 0;
+ record->next = 0;
+ new->record = newc;
new->next = 0;
+ newc->records = record;
+ newc->merge_key = merge_key;
+ newc->relevance = 0;
+ newc->term_frequency_vec = 0;
+ newc->recid = (*total)++;
+ newc->metadata = nmem_malloc(l->nmem,
+ sizeof(struct record_metadata*) * service->num_metadata);
+ memset(newc->metadata, 0, sizeof(struct record_metadata*) * service->num_metadata);
+ newc->sortkeys = nmem_malloc(l->nmem,
+ sizeof(struct record_metadata*) * service->num_sortkeys);
+ memset(newc->sortkeys, 0, sizeof(union data_types*) * service->num_sortkeys);
+
*p = new;
- assert(l->num_records < l->flatlist_size);
- l->flatlist[l->num_records++] = record;
- head = record;
+ l->flatlist[l->num_records++] = newc;
+ cluster = newc;
}
- return head;
+ return cluster;
}