1 /* This file is part of the YAZ toolkit.
2 * Copyright (C) 1995-2012 Index Data
3 * See the file LICENSE for details.
7 * \file marc_read_iso2709.c
8 * \brief Implements reading of MARC as ISO2709
21 #include <yaz/marcdisp.h>
22 #include <yaz/wrbuf.h>
23 #include <yaz/yaz-util.h>
/* Reads the ISO2709 MARC record held in buf and hands its parts to mt:
 * the leader through yaz_marc_set_leader, and each field through
 * yaz_marc_add_datafield / yaz_marc_add_subfield or
 * yaz_marc_add_controlfield. Diagnostics are emitted with
 * yaz_marc_cprintf on mt.
 *
 * mt     MARC handle receiving the parsed data and diagnostics.
 * buf    record bytes; record_length is taken from atoi_n(buf, 5) and
 *        the directory scan starts at offset 24.
 * bsize  size of buf, or -1 when the size is not known (the buffer size
 *        comparison is skipped in that case).
 *
 * Returns record_length at the end of the function.
 * NOTE(review): this listing omits lines of the function (braces, some
 * declarations, the statements following each diagnostic and some call
 * arguments), so the outcome of the error paths cannot be confirmed
 * from what is shown here.
 */
25 int yaz_marc_read_iso2709(yaz_marc_t mt, const char *buf, int bsize)
30 int identifier_length;
33 int length_data_entry;
35 int length_implementation;
39 record_length = atoi_n (buf, 5);
/* NOTE(review): the condition tests "< 25" while the message text
 * says "< 24" - confirm which limit is intended. */
40 if (record_length < 25)
42 yaz_marc_cprintf(mt, "Record length %d < 24", record_length);
45 /* bail out if bsize is known and record_length is greater than that */
/* NOTE(review): the message prints record_length and bsize joined by
 * "<" although this branch is taken when record_length > bsize. */
46 if (bsize != -1 && record_length > bsize)
48 yaz_marc_cprintf(mt, "Record appears to be larger than buffer %d < %d",
49 record_length, bsize);
52 if (yaz_marc_get_debug(mt))
53 yaz_marc_cprintf(mt, "Record length %5d", record_length);
55 yaz_marc_set_leader(mt, buf,
61 &length_implementation);
63 /* First pass. determine length of directory & base of data */
/* Directory entries are walked from offset 24 until an ISO2709_FS byte
 * is met. Each entry is 3 tag bytes followed by length_data_entry and
 * length_starting bytes. */
64 for (entry_p = 24; buf[entry_p] != ISO2709_FS; )
66 /* length of directory entry */
67 int l = 3 + length_data_entry + length_starting;
/* the entry would reach or pass record_length before any FS was seen */
68 if (entry_p + l >= record_length)
70 yaz_marc_cprintf(mt, "Directory offset %d: end of record."
71 " Missing FS char", entry_p);
/* debug only: dump the tag, length and starting parts of the entry */
74 if (yaz_marc_get_debug(mt))
76 WRBUF hex = wrbuf_alloc();
78 wrbuf_puts(hex, "Tag ");
79 wrbuf_write_escaped(hex, buf + entry_p, 3);
80 wrbuf_puts(hex, ", length ");
81 wrbuf_write_escaped(hex, buf + entry_p + 3,
83 wrbuf_puts(hex, ", starting ");
84 wrbuf_write_escaped(hex, buf + entry_p + 3 + length_data_entry,
86 yaz_marc_cprintf(mt, "Directory offset %d: %s",
87 entry_p, wrbuf_cstr(hex));
90 /* Check for digits in length+starting info */
92 if (!yaz_isdigit(buf[entry_p + l]))
96 WRBUF hex = wrbuf_alloc();
97 /* Not all digits, so stop directory scan */
98 wrbuf_write_escaped(hex, buf + entry_p,
99 length_data_entry + length_starting + 3);
100 yaz_marc_cprintf(mt, "Directory offset %d: Bad value for data"
101 " length and/or length starting (%s)", entry_p,
106 entry_p += 3 + length_data_entry + length_starting;
/* entry_p is now where the first pass stopped; the second pass below
 * runs up to this position */
108 end_of_directory = entry_p;
/* the base address is expected to be the byte right after the
 * position where the directory scan stopped */
109 if (base_address != entry_p+1)
111 yaz_marc_cprintf(mt, "Base address not at end of directory,"
112 " base %d, end %d", base_address, entry_p+1);
115 /* Second pass. parse control - and datafields */
116 for (entry_p = 24; entry_p != end_of_directory; )
123 int identifier_flag = 0;
/* keep the entry's starting offset for use in diagnostics */
124 int entry_p0 = entry_p;
126 memcpy (tag, buf+entry_p, 3);
/* read the data length and the data offset from the directory entry */
129 data_length = atoi_n(buf+entry_p, length_data_entry);
130 entry_p += length_data_entry;
131 data_offset = atoi_n(buf+entry_p, length_starting);
132 entry_p += length_starting;
/* i: position of the field data in buf (offset is relative to
 * base_address); end_offset: index of the field's last byte */
133 i = data_offset + base_address;
134 end_offset = i+data_length-1;
136 if (data_length <= 0 || data_offset < 0)
139 if (yaz_marc_get_debug(mt))
141 yaz_marc_cprintf(mt, "Tag: %s. Directory offset %d: data-length %d,"
143 tag, entry_p0, data_length, data_offset);
/* the field's last byte must lie inside the record */
145 if (end_offset >= record_length)
147 yaz_marc_cprintf(mt, "Directory offset %d: Data out of bounds %d >= %d",
148 entry_p0, end_offset, record_length);
/* memcmp is non-zero when the tag does not begin with "00" */
152 if (memcmp (tag, "00", 2))
153 identifier_flag = 1; /* if not 00X assume subfields */
154 else if (indicator_length < 4 && indicator_length > 0)
156 /* Danmarc 00X have subfields */
/* look for ISO2709_IDFS directly after the indicator bytes, or one
 * byte further on */
157 if (buf[i + indicator_length] == ISO2709_IDFS)
159 else if (buf[i + indicator_length + 1] == ISO2709_IDFS)
166 i += identifier_flag-1;
167 if (indicator_length)
169 /* skip RS/FS bytes in indicator. They are not allowed there */
171 for (j = indicator_length; --j >= 0; )
177 yaz_marc_cprintf(mt, "Bad indicator data. "
178 "Skipping %d bytes", j);
/* the indicator bytes at buf+i are passed along with the tag, then
 * i moves past them */
181 yaz_marc_add_datafield(mt, tag, buf+i, indicator_length);
182 i += indicator_length;
/* subfields: continue while inside the field and not at RS/FS */
185 while (i < end_offset &&
186 buf[i] != ISO2709_RS && buf[i] != ISO2709_FS)
/* the subfield passed on below starts one byte after position i */
188 int code_offset = i+1;
/* advance to the next RS, IDFS or FS, or to end_offset */
191 while (i < end_offset &&
192 buf[i] != ISO2709_RS && buf[i] != ISO2709_IDFS &&
193 buf[i] != ISO2709_FS)
196 yaz_marc_add_subfield(mt, buf+code_offset, i - code_offset);
/* control field: scan to the first RS/FS or to end_offset */
203 while (i < end_offset &&
204 buf[i] != ISO2709_RS && buf[i] != ISO2709_FS)
206 yaz_marc_add_controlfield(mt, tag, buf+i0, i-i0);
210 yaz_marc_cprintf(mt, "Separator but not at end of field length=%d",
213 if (buf[i] != ISO2709_RS && buf[i] != ISO2709_FS)
215 yaz_marc_cprintf(mt, "No separator at end of field length=%d",
219 return record_length;
225 * c-file-style: "Stroustrup"
226 * indent-tabs-mode: nil
228 * vim: shiftwidth=4 tabstop=8 expandtab