1 /* $Id: test_relevance.c,v 1.2 2007-04-17 13:30:24 marc Exp $
2 Copyright (c) 2006-2007, Index Data.
4 This file is part of Pazpar2.
6 Pazpar2 is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 2, or (at your option) any later
11 Pazpar2 is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 You should have received a copy of the GNU General Public License
17 along with Pazpar2; see the file LICENSE. If not, write to the
18 Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA
27 #include <sys/socket.h>
39 #include <yaz/timing.h>
45 //#include "pazpar2.h"
46 #include "relevance.h"
/*
 * test_relevance: exercise the relevance / record-list API with one
 * hand-built record.
 *
 * Steps visible in this function:
 *   - create an NMEM handle with nmem_create();
 *   - create a relevance object from `queryterms` and a record list,
 *     both calls receiving the same `nmem` and `numrecs`;
 *   - fill in a `struct conf_service` by hand: one metadata entry whose
 *     name is "aname", and zero sort keys;
 *   - allocate one `struct record` with nmem_malloc() and clear its
 *     sortkeys pointer and metadata pointer array;
 *   - insert the record into the record list under the merge key
 *     "amergekey" and pass the returned cluster to relevance_newrec().
 *
 * argc, argv: not referenced in the lines visible here.
 *
 * NOTE(review): several lines of this function are not visible in this
 * view (for example the declarations of `numrecs` and `total`, the
 * initializer of `queryterms`, and the braces) -- confirm against the
 * full file before relying on this description.
 */
55 void test_relevance(int argc, char **argv)
57 NMEM nmem = nmem_create();
// Query terms handed to relevance_create(); the active initializer is
// not visible here, only the commented-out alternative below.
60 const char * queryterms[] =
62 // {"ål", "økologi", "æble", 0};
64 struct record_cluster *cluster = 0;
65 struct conf_service service;
66 struct reclist *list = 0;
67 struct record *record = 0;
68 const char *mergekey = "amergekey";
71 struct relevance *rel = 0;
// Both objects are created from the same nmem handle and numrecs value.
73 rel = relevance_create(nmem, queryterms, numrecs);
74 list = reclist_create(nmem, numrecs);
76 // setting up service - sic!
77 // this should have been done by a nice service_create function !!!
79 service.num_metadata = 1;
81 service.num_sortkeys = 0;
// Only the size argument of this allocation is visible; presumably it
// assigns service.metadata room for num_metadata entries -- confirm.
83 if (service.num_metadata)
86 sizeof(struct conf_metadata) * service.num_metadata);
// Name the metadata entry; the literal is copied with nmem_strdup().
89 service.metadata->name = nmem_strdup(nmem, "aname");
90 //service.metadata->brief = 1;
91 //service.metadata->termlist = 1;
92 //service.metadata->rank = 1;
93 //service.metadata->type = Metadata_type_generic;
94 //service.metadata->type = Metadata_type_year;
95 //service.metadata->merge = Metadata_merge_no;
96 //service.metadata->merge = Metadata_merge_unique;
97 //service.metadata->merge = Metadata_merge_longest;
98 //service.metadata->merge = Metadata_merge_range;
99 //service.metadata->merge = Metadata_merge_all;
// num_sortkeys was set to 0 above, so this condition is false here.
// NOTE(review): presumably `service.sortkeys = 0` below is the else
// branch; the `else` itself is not visible -- confirm.
102 if (service.num_sortkeys)
105 sizeof(struct conf_sortkey) * service.num_sortkeys);
107 service.sortkeys = 0;
108 // service.sortkeys.type = Metadata_sortkey_numeric;
109 // service.sortkeys.type = Metadata_sortkey_skiparticle;
110 // service.sortkeys.name = service.metadata->name;
111 //service.metadata->sortkey_offset = sk_node;
115 // preparing one record
116 // this should have been done by a nice record_create function
117 // why the heck does the record know which client it belongs to ??
119 record = nmem_malloc(nmem, sizeof(struct record));
121 // which client should I use for record->client = cl; ??
123 // and which sortkeys data_types list should I use ??
124 record->sortkeys = 0;
// Only the size argument of the allocation is visible; the memset then
// zeroes one `struct record_metadata *` slot per service metadata entry.
127 sizeof(struct record_metadata*) * service.num_metadata);
128 memset(record->metadata, 0,
129 sizeof(struct record_metadata*) * service.num_metadata);
132 // now we need to put some actual data into the record ... how ??
133 // there is a hell of a lot spaghetti code in logic.c ingest_record()
134 // line 694 ff snippet from there:
135 // this code needs to be analyzed and the fundamental stuff extracted
// NOTE(review): the lines from here down to the add_facet() calls are
// the snippet quoted from ingest_record(). They use identifiers that are
// not declared in the visible part of this function (se, md, sk, res,
// imeta, newm, wheretoput, value, type, first, last, ...) and access
// `service` through `->` although it is declared as a struct above.
// Presumably the snippet is excluded from compilation by directives that
// are not visible in this view -- confirm.
138 service->metadata[imeta].name;
139 md = &service->metadata[imeta];
140 if (md->sortkey_offset >= 0)
141 sk = &service->sortkeys[md->sortkey_offset];
144 // Find out where we are putting it if (md->merge == Metadata_merge_no)
145 wheretoput = &res->metadata[imeta];
147 wheretoput = &cluster->metadata[imeta];
151 newm = nmem_malloc(se->nmem, sizeof(struct record_metadata));
153 if (md->type == Metadata_type_generic)
// Skip leading whitespace, then scan backwards from the end of the
// string over trailing characters from the set " ,/.:([".
156 for (p = (char *) value; *p && isspace(*p); p++)
158 for (pe = p + strlen(p) - 1;
159 pe > p && strchr(" ,/.:([", *pe); pe--)
161 newm->data.text = nmem_strdup(se->nmem, p);
164 else if (md->type == Metadata_type_year)
166 if (extract_years((char *) value, &first, &last) < 0)
171 yaz_log(YLOG_WARN, "Unknown type in metadata element %s", type);
174 if (md->type == Metadata_type_year && md->merge != Metadata_merge_range)
176 yaz_log(YLOG_WARN, "Only range merging supported for years");
179 if (md->merge == Metadata_merge_unique)
181 struct record_metadata *mnode;
// Walk the existing list looking for an entry whose text equals the
// new entry's text.
182 for (mnode = *wheretoput; mnode; mnode = mnode->next)
183 if (!strcmp((const char *) mnode->data.text, newm->data.text))
187 newm->next = *wheretoput;
191 else if (md->merge == Metadata_merge_longest)
194 strlen(newm->data.text) > strlen((*wheretoput)->data.text))
// Work on a copy of the text: the copy is passed to normalize_mergekey()
// and then stored as the cluster's sort key text.
199 char *s = nmem_strdup(se->nmem, newm->data.text);
200 if (!cluster->sortkeys[md->sortkey_offset])
201 cluster->sortkeys[md->sortkey_offset] =
202 nmem_malloc(se->nmem, sizeof(union data_types));
203 normalize_mergekey(s,
204 (sk->type == Metadata_sortkey_skiparticle));
205 cluster->sortkeys[md->sortkey_offset]->text = s;
209 else if (md->merge == Metadata_merge_all || md->merge == Metadata_merge_no)
211 newm->next = *wheretoput;
214 else if (md->merge == Metadata_merge_range)
216 assert(md->type == Metadata_type_year);
220 (*wheretoput)->data.number.min = first;
221 (*wheretoput)->data.number.max = last;
223 cluster->sortkeys[md->sortkey_offset] = &newm->data;
// Widen the stored range so that it also covers [first, last].
227 if (first < (*wheretoput)->data.number.min)
228 (*wheretoput)->data.number.min = first;
229 if (last > (*wheretoput)->data.number.max)
230 (*wheretoput)->data.number.max = last;
233 relevance_countwords(se->relevance, cluster,
234 (char *) value, md->rank);
237 if (md->type == Metadata_type_year)
// `year` receives the decimal text of `last` / `first` before each
// add_facet() call; its declaration is not visible here.
240 sprintf(year, "%d", last);
241 add_facet(se, (char *) type, year);
244 sprintf(year, "%d", first);
245 add_facet(se, (char *) type, year);
249 add_facet(se, (char *) type, (char *) value);
253 //mergekey_norm = (xmlChar *) nmem_strdup(se->nmem, (char*) mergekey);
254 //normalize_mergekey((char *) mergekey_norm, 0);
257 // insert one record into recordlist/cluster - what's a cluster, exactly??
// The merge key is passed with its const qualifier cast away; `total`
// is passed by address (its declaration is not visible in this view).
258 cluster = reclist_insert(list, &service, record, (char *)mergekey, &total);
// Hand the cluster returned by reclist_insert() to the relevance object.
261 relevance_newrec(rel, cluster);
269 //relevance_prepare_read(rel, list);
272 //relevance_donerecord(rel, cluster);
273 // relevance_countwords(se->rel, cluster,
274 // (char *) value, service.metadata->rank);
/*
 * Program entry point for this test: invokes YAZ_CHECK_INIT with the
 * command-line arguments, then calls test_relevance() with the same
 * arguments.
 *
 * NOTE(review): the function's braces and anything after the
 * test_relevance() call (such as the termination/return) are not
 * visible in this view -- confirm against the full file.
 */
286 int main(int argc, char **argv)
288 YAZ_CHECK_INIT(argc, argv);
292 test_relevance(argc, argv);
304 * indent-tabs-mode: nil
306 * vim: shiftwidth=4 tabstop=8 expandtab