-/* $Id: zebramap.c,v 1.75 2007-12-13 18:08:26 adam Exp $
- Copyright (C) 1995-2007
- Index Data ApS
-
- This file is part of the Zebra server.
-
- Zebra is free software; you can redistribute it and/or modify it under
- the terms of the GNU General Public License as published by the Free
- Software Foundation; either version 2, or (at your option) any later
- version.
-
- Zebra is distributed in the hope that it will be useful, but WITHOUT ANY
- WARRANTY; without even the implied warranty of MERCHANTABILITY or
- FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
- for more details.
-
- You should have received a copy of the GNU General Public License
- along with Zebra; see the file LICENSE.zebra. If not, write to the
- Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA
- 02111-1307, USA.
+/* This file is part of the Zebra server.
+ Copyright (C) 2004-2013 Index Data
+
+Zebra is free software; you can redistribute it and/or modify it under
+the terms of the GNU General Public License as published by the Free
+Software Foundation; either version 2, or (at your option) any later
+version.
+
+Zebra is distributed in the hope that it will be useful, but WITHOUT ANY
+WARRANTY; without even the implied warranty of MERCHANTABILITY or
+FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
+
*/
+#if HAVE_CONFIG_H
+#include <config.h>
+#endif
#include <assert.h>
#include <stdlib.h>
#include <ctype.h>
}
else if (!zm)
{
- yaz_log(YLOG_WARN, "%s:%d: Missing sort/index before '%s'",
+ yaz_log(YLOG_WARN, "%s:%d: Missing sort/index before '%s'",
fname, lineno, argv[0]);
return -1;
}
zm->u.sort.entry_size = atoi(argv[1]);
else
{
- yaz_log(YLOG_WARN,
- "%s:%d: entrysize only valid in sort section",
+ yaz_log(YLOG_WARN,
+ "%s:%d: entrysize only valid in sort section",
fname, lineno);
return -1;
}
#if YAZ_HAVE_ICU
UErrorCode status;
xmlNode *xml_node = xmlDocGetRootElement(zm->doc);
- zm->icu_chain =
+ zm->icu_chain =
icu_chain_xml_config(xml_node,
/* not sure about sort for this function yet.. */
#if 1
1,
#else
zm->type == ZEBRA_MAP_TYPE_SORT,
-#endif
+#endif
&status);
if (!zm->icu_chain)
{
}
else
{
- yaz_log(YLOG_WARN, "%s:%d: Unrecognized directive '%s'",
+ yaz_log(YLOG_WARN, "%s:%d: Unrecognized directive '%s'",
fname, lineno, argv[0]);
return -1;
}
return zms;
}
+void zebra_maps_define_default_sort(zebra_maps_t zms) /* Define a default sort map in zms: id "s", type ZEBRA_MAP_TYPE_SORT, sort entry size 80. Returns nothing. */
+{
+ zebra_map_t zm = zebra_add_map(zms, "s", ZEBRA_MAP_TYPE_SORT); /* add the map to zms under id "s" as a sort-type map */
+ zm->u.sort.entry_size = 80; /* default entry size for this sort map; zm is dereferenced unchecked -- NOTE(review): presumably zebra_add_map never returns NULL, confirm */
+}
+
zebra_map_t zebra_map_get(zebra_maps_t zms, const char *id)
{
zebra_map_t zm;
if (!zm)
{
zm = zebra_add_map(zms, id, ZEBRA_MAP_TYPE_INDEX);
-
+
/* no reason to warn if no maps are read from file */
if (zms->no_files_read)
yaz_log(YLOG_WARN, "Unknown register type: %s", id);
chrmaptab maptab = zebra_charmap_get(zm);
if (maptab)
return chr_map_input(maptab, from, len, first);
-
+
zm->zebra_maps->temp_map_str[0] = **from;
(*from)++;
const char **from, int len, int *q_map_match)
{
chrmaptab maptab;
-
+
*q_map_match = 0;
maptab = zebra_charmap_get(zm);
if (maptab)
/* ------------------------------------ */
int zebra_maps_is_complete(zebra_map_t zm)
-{
+{
if (zm)
return zm->completeness;
return 0;
return zm->type == ZEBRA_MAP_TYPE_STATICRANK;
return 0;
}
-
+
int zebra_maps_is_sort(zebra_map_t zm)
{
if (zm)
break;
case 106: /* document-text */
*search_type = "or-list";
- break;
+ break;
case -1:
case 1: /* phrase */
case 2: /* word */
- case 108: /* string */
+ case 108: /* string */
*search_type = "phrase";
break;
case 107: /* local-number */
UErrorCode status;
while (icu_chain_next_token(zm->icu_chain, &status))
{
- assert(U_SUCCESS(status));
+ if (!U_SUCCESS(status))
+ return 0;
*result_buf = icu_chain_token_sortkey(zm->icu_chain);
assert(*result_buf);
if (**result_buf != '\0')
return 1;
}
- assert(U_SUCCESS(status));
}
return 0;
#else
int zebra_map_tokenize_start(zebra_map_t zm,
const char *buf, size_t len)
{
+#if YAZ_HAVE_ICU
+ int ret;
+#endif
assert(zm->use_chain);
wrbuf_rewind(zm->input_str);
wrbuf_rewind(zm->print_str);
wrbuf_write_escaped(zm->print_str, wrbuf_buf(zm->input_str),
wrbuf_len(zm->input_str));
-
- yaz_log(YLOG_LOG, "input %s",
- wrbuf_cstr(zm->print_str));
- }
- icu_chain_assign_cstr(zm->icu_chain,
- wrbuf_cstr(zm->input_str),
- &status);
- assert(U_SUCCESS(status));
- }
-#endif
- return 0;
-}
-#if 0
-int zebra_map_tokenize(zebra_map_t zm,
- const char *buf, size_t len,
- const char **result_buf, size_t *result_len)
-{
- assert(zm->use_chain);
-
- if (buf)
- {
- wrbuf_rewind(zm->input_str);
- wrbuf_write(zm->input_str, buf, len);
- zm->simple_off = 0;
- }
-
-#if YAZ_HAVE_ICU
- if (!zm->icu_chain)
- return tokenize_simple(zm, result_buf, result_len);
- else
- {
- UErrorCode status;
- if (buf)
- {
- if (zm->debug)
- {
- wrbuf_rewind(zm->print_str);
- wrbuf_write_escaped(zm->print_str, wrbuf_buf(zm->input_str),
- wrbuf_len(zm->input_str));
-
- yaz_log(YLOG_LOG, "input %s",
- wrbuf_cstr(zm->print_str));
- }
- icu_chain_assign_cstr(zm->icu_chain,
- wrbuf_cstr(zm->input_str),
- &status);
- assert(U_SUCCESS(status));
+ yaz_log(YLOG_LOG, "input %s",
+ wrbuf_cstr(zm->print_str));
}
- while (icu_chain_next_token(zm->icu_chain, &status))
+ ret = icu_chain_assign_cstr(zm->icu_chain,
+ wrbuf_cstr(zm->input_str), &status);
+ if (!ret && !U_SUCCESS(status))
{
- assert(U_SUCCESS(status));
- *result_buf = icu_chain_token_sortkey(zm->icu_chain);
- assert(*result_buf);
-
- *result_len = strlen(*result_buf);
-
if (zm->debug)
{
- wrbuf_rewind(zm->print_str);
- wrbuf_write_escaped(zm->print_str, *result_buf, *result_len);
- yaz_log(YLOG_LOG, "output %s", wrbuf_cstr(zm->print_str));
+ yaz_log(YLOG_WARN, "bad encoding for input");
}
-
- if (**result_buf != '\0')
- return 1;
+ return -1;
}
- assert(U_SUCCESS(status));
}
- return 0;
-#else
- return tokenize_simple(zm, result_buf, result_len);
#endif
+ return 0;
}
-#endif
int zebra_maps_is_icu(zebra_map_t zm)
{
+ assert(zm);
#if YAZ_HAVE_ICU
return zm->use_chain;
#else
/*
* Local variables:
* c-basic-offset: 4
+ * c-file-style: "Stroustrup"
* indent-tabs-mode: nil
* End:
* vim: shiftwidth=4 tabstop=8 expandtab