[10365] | 1 | /* ------------------------------------------------------------------- */
|
---|
| 2 | /* MARC2709 : Converts a "line format MARC record" into ISO 2709 */
|
---|
| 3 | /* */
|
---|
| 4 | /* Input string requirements: */
|
---|
| 5 | /* 1. New MARC tag is indicated by MARC tag in pos 1-3 */
|
---|
| 6 | /* (may be preceded by *). Indicator follows in next 2 */
|
---|
| 7 | /* bytes. */
|
---|
| 8 | /* 2. Continuation line is indicated by blank in col 1 */
|
---|
| 9 | /* 3. End-of-record (^) may or may not be present */
|
---|
| 10 | /* */
|
---|
| 11 | /* author : Ole Husby */
|
---|
| 12 | /* updated : 1998-09-30 */
|
---|
| 13 | /* ------------------------------------------------------------------- */
|
---|
| 14 |
|
---|
| 15 | #include <stdlib.h>
|
---|
| 16 | #include <stdio.h>
|
---|
| 17 | #include <string.h>
|
---|
| 18 | #include <ctype.h>
|
---|
| 19 |
|
---|
/* NOTE(review): NORMARC is not referenced by any code visible in this file. */
#define NORMARC 12

/* Delimiter bytes, kept as one-character strings so they can be appended
   with the string functions used throughout this file. */
#define SUBFIELD_CODE "\x1f"
#define FIELD_TERMINATOR "\x1e"
#define RECORD_TERMINATOR "\x1d"

/* Single characters that MARC2709() stores into the leader. */
#define INDICATOR_COUNT '2'
#define SUBFIELD_CODE_COUNT '2'
#define LENGTH_OF_LENGTH_OF_FIELD '4'
#define LENGTH_OF_STARTING_CHARACTER_POSITION '5'
/* Filler that MARC2709() copies with strncpy() into the 2-byte and 3-byte
   unused leader areas.
   NOTE(review): strncpy() pads with NUL bytes when the source is shorter
   than the count, so this literal needs at least three blanks - confirm
   that whitespace has not been collapsed here. */
#define UNUSED " "
/* Tags that are stored in their own buffers instead of data_field. */
#define TAG001 "001"
#define TAG008 "008"
/* Base value for 'skip', the offset added to data-field start positions in
   the directory (presumably the 41 bytes that the directory reserves for
   tag 008 - confirm). */
#define SKIP 41
|
---|
| 34 |
|
---|
/* Working buffers shared by all routines in this file. They are static,
   so every call to MARC2709() reuses (and overwrites) the same storage. */
static char out_record[10240],   /* finished record returned by MARC2709()     */
leader[24+1],                    /* NOTE(review): unused in the visible code   */
directory[10240],                /* 001/008 entries followed by sorted direlem */
field_001[32],                   /* contents of tag 001                        */
field_008[40+2],                 /* contents of tag 008                        */
data_field[10240];               /* concatenated data of all other fields      */


/* NOTE(review): unused here; MARC2709() declares its own local 'logline'. */
static char logline[128];
/* rstr: result buffer of itoal(). dollar / dollarstring: the subfield
   delimiter as a char and as a string, both set by MARC2709(). */
static char rstr[6], dollar, dollarstring[2];
/* Offset added to a field's position inside data_field when out_field()
   writes its starting position into the directory. */
static int skip;

/* One 12-character directory entry (tag + length + start) per data field,
   filled by out_field() and sorted by MARC2709(). */
static char direlem[300][12+1];
/* Number of direlem[] slots in use. */
static int dircntr;
|
---|
| 49 |
|
---|
/* The 24-byte record leader, viewable either as one NUL-terminated string
   (ldr_string) or as its individual fixed-width parts (ltab). Every member
   is a char or char array, so the parts overlay ldr_string byte for byte. */
union LDR {
    char ldr_string[24 + 1];
    struct {
        char record_length[5];
        char record_status;
        char record_type;
        char bibliographic_level;
        char unused1[2];
        char indicator_count;
        char subfield_code_count;
        char base_adress[5];
        char unused2[3];
        char entry1;
        char entry2;
        char entry3;
        char entry4;
    } ltab;
} ldr;
|
---|
| 68 |
|
---|
/* Set to 1 by MARC2709() once the first tag line has been read; out_field()
   returns immediately while it is 0. make_001() also resets it to 0. */
static int startet = 0;
|
---|
| 70 |
|
---|
| 71 |
|
---|
| 72 |
|
---|
/* ------------------------------------------------------------------- */
/* Compare function for qsort                                           */
/*                                                                       */
/* Both arguments point at NUL-terminated strings (the directory        */
/* entries); ordering is that of strcmp(). The casts keep the const     */
/* qualifier instead of discarding it.                                  */
/* ------------------------------------------------------------------- */

int cmp(const void *a, const void *b)
{
    return strcmp((const char *)a, (const char *)b);
}
|
---|
| 81 |
|
---|
| 82 |
|
---|
| 83 |
|
---|
| 84 |
|
---|
| 85 | /* ------------------------------------------------------------------- */
|
---|
| 86 | /* Convert integer to string of fixed length. Right justified padded */
|
---|
| 87 | /* with zeros. Returns NULL if error */
|
---|
| 88 | /* ------------------------------------------------------------------- */
|
---|
| 89 |
|
---|
| 90 | char *itoal(int n, int len)
|
---|
| 91 | {
|
---|
| 92 | char *r;
|
---|
| 93 | r = (char *) rstr;
|
---|
| 94 |
|
---|
| 95 | switch (len)
|
---|
| 96 | {
|
---|
| 97 | case 4 : sprintf(r, "%04d", n); break;
|
---|
| 98 | case 5 : sprintf(r, "%05d", n); break;
|
---|
| 99 | default : return NULL;
|
---|
| 100 | }
|
---|
| 101 |
|
---|
| 102 | r[len] = '\0';
|
---|
| 103 |
|
---|
| 104 | return r;
|
---|
| 105 | }
|
---|
| 106 |
|
---|
| 107 |
|
---|
| 108 |
|
---|
| 109 | /* ------------------------------------------------------------------- */
|
---|
| 110 | /* One 001 subfield is put into field_001 */
|
---|
| 111 | /* ------------------------------------------------------------------- */
|
---|
| 112 |
|
---|
| 113 | static int make_001(char *data, char subfield)
|
---|
| 114 | {
|
---|
| 115 | int len;
|
---|
| 116 |
|
---|
| 117 | startet = 0;
|
---|
| 118 | switch (subfield)
|
---|
| 119 | {
|
---|
| 120 | case ' ' : break;
|
---|
| 121 | case 'a' : break;
|
---|
| 122 | default : return 1;
|
---|
| 123 | }
|
---|
| 124 |
|
---|
| 125 | while (data[0] == ' ') data++;
|
---|
| 126 | strcpy(field_001, data);
|
---|
| 127 |
|
---|
| 128 | len = strlen(data) + 1;
|
---|
| 129 | skip = SKIP + len;
|
---|
| 130 |
|
---|
| 131 | sprintf(directory, "00100%2d000000080041000%2d", len, len);
|
---|
| 132 | return 1;
|
---|
| 133 | }
|
---|
| 134 |
|
---|
| 135 |
|
---|
| 136 |
|
---|
| 137 | /* ------------------------------------------------------------------- */
|
---|
| 138 | /* One subfield string is appended to data_field */
|
---|
| 139 | /* ------------------------------------------------------------------- */
|
---|
| 140 |
|
---|
| 141 | static int out_subfield(char *data, char *ftag, char subfield, char nextsubfield)
|
---|
| 142 | {
|
---|
| 143 | int len, subint;
|
---|
| 144 | char subreplace, *p, *up;
|
---|
| 145 |
|
---|
| 146 | while (data[strlen(data) -1] == ' ')
|
---|
| 147 | data[strlen(data) -1] = '\0'; /* strip trailing blanks */
|
---|
| 148 |
|
---|
| 149 | if (subfield == '3') /* always discard $3 */
|
---|
| 150 | return 1;
|
---|
| 151 |
|
---|
| 152 | if (strcmp(ftag, TAG001) == 0) /* 001 data treatment */
|
---|
| 153 | {
|
---|
| 154 | make_001(data, subfield);
|
---|
| 155 | return 1;
|
---|
| 156 | }
|
---|
| 157 |
|
---|
| 158 | if (strcmp(ftag, TAG008) == 0) /* 008 data treatment */
|
---|
| 159 | {
|
---|
| 160 | strncpy(field_008, data, strlen(data));
|
---|
| 161 | return 1;
|
---|
| 162 | }
|
---|
| 163 |
|
---|
| 164 | if (subfield != ' ') /* handle subfield code */
|
---|
| 165 | {
|
---|
| 166 | strcat(data_field, SUBFIELD_CODE);
|
---|
| 167 | len = strlen(data_field);
|
---|
| 168 | data_field[len] = subfield;
|
---|
| 169 | data_field[len + 1] = '\0';
|
---|
| 170 | }
|
---|
| 171 |
|
---|
| 172 | while(data[0] == ' ') data++; /* strip leading blanks */
|
---|
| 173 | if (!data) return 0;
|
---|
| 174 |
|
---|
| 175 | strcat(data_field, data); /* append data */
|
---|
| 176 |
|
---|
| 177 | return 1;
|
---|
| 178 | }
|
---|
| 179 |
|
---|
| 180 |
|
---|
| 181 |
|
---|
| 182 | /* ------------------------------------------------------------------- */
|
---|
| 183 | /* One MARC field is split into subfields and given to output */
|
---|
| 184 | /* ------------------------------------------------------------------- */
|
---|
| 185 |
|
---|
| 186 | static int out_field(char *data, char *ftag, char *find)
|
---|
| 187 | {
|
---|
| 188 | char lnumber[5], snumber[6];
|
---|
| 189 | int fStart, fLen, moresubs;
|
---|
| 190 | char subfield[5120], *sub, subcode, *nextsub, nextsubcode;
|
---|
| 191 | char *v, subfield_v[32];
|
---|
| 192 |
|
---|
| 193 | if (!startet) return 1;
|
---|
| 194 |
|
---|
| 195 | if ((strncmp(ftag, "00", 2) == 0) &&
|
---|
| 196 | (strcmp(ftag, TAG001) != 0) &&
|
---|
| 197 | (strcmp(ftag, TAG008) != 0))
|
---|
| 198 | return 1;
|
---|
| 199 |
|
---|
| 200 | fStart = strlen(data_field);
|
---|
| 201 |
|
---|
| 202 | if (strncmp(data, " $", 3) == 0) data +=2; /* possible if 008 */
|
---|
| 203 |
|
---|
| 204 | if (data[0] != dollar) /* Dollar sign missing */
|
---|
| 205 | {
|
---|
| 206 | if (strncmp(ftag,"00",2) != 0) return 0; /* only allowed if tag=00x */
|
---|
| 207 |
|
---|
| 208 | if (strcmp(ftag, TAG001) == 0) /* 001: skip leading blanks */
|
---|
| 209 | while (data[0] == ' ')
|
---|
| 210 | data++;
|
---|
| 211 |
|
---|
[10385] | 212 | subcode = ' ';
|
---|
[10365] | 213 | nextsubcode = ' ';
|
---|
| 214 |
|
---|
| 215 | if (!out_subfield(data, ftag, subcode, nextsubcode))
|
---|
| 216 | return 0;
|
---|
| 217 | return 1;
|
---|
| 218 | }
|
---|
| 219 |
|
---|
| 220 | else
|
---|
| 221 | {
|
---|
| 222 | data++;
|
---|
| 223 |
|
---|
| 224 | if (!data) return 0;
|
---|
| 225 |
|
---|
| 226 | if (strncmp(ftag,"00",2) != 0) /* append indicators */
|
---|
| 227 | strcat(data_field, find);
|
---|
| 228 |
|
---|
| 229 | sub = strtok(data, dollarstring); /* first subfield */
|
---|
| 230 | if (!sub)
|
---|
| 231 | return 0;
|
---|
| 232 |
|
---|
| 233 | /* printf("--- %s\n", sub); */
|
---|
| 234 |
|
---|
| 235 | subcode = sub[0];
|
---|
| 236 | sub++;
|
---|
| 237 |
|
---|
| 238 | moresubs = 1;
|
---|
| 239 |
|
---|
| 240 | while (moresubs) /* loop while more subflds */
|
---|
| 241 | {
|
---|
| 242 | nextsub = strtok(NULL, dollarstring); /* next subfld */
|
---|
| 243 | if (nextsub)
|
---|
| 244 | {
|
---|
| 245 | /* printf("--- %s\n", nextsub); */
|
---|
| 246 | nextsubcode = nextsub[0];
|
---|
| 247 | nextsub++;
|
---|
| 248 | }
|
---|
| 249 | else
|
---|
| 250 | nextsubcode = ' ';
|
---|
| 251 |
|
---|
| 252 | if (sub)
|
---|
| 253 | {
|
---|
| 254 | if (!out_subfield(sub, ftag, subcode, nextsubcode))
|
---|
| 255 | return 0;
|
---|
| 256 | /* printf("Denne |%c| Neste |%c|\n", subcode, nextsubcode); */
|
---|
| 257 | }
|
---|
| 258 |
|
---|
| 259 | if (nextsub)
|
---|
| 260 | {
|
---|
| 261 | subcode = nextsubcode;
|
---|
| 262 | sub = nextsub;
|
---|
| 263 | }
|
---|
| 264 | else
|
---|
| 265 | moresubs = 0;
|
---|
| 266 | }
|
---|
| 267 | }
|
---|
| 268 |
|
---|
| 269 | if (strcmp(ftag,TAG001) == 0 || strcmp(ftag,TAG008) == 0)
|
---|
| 270 | return 1; /* directory ready */
|
---|
| 271 |
|
---|
| 272 | strcat(data_field, FIELD_TERMINATOR); /* terminate data field */
|
---|
| 273 | fLen = strlen(data_field) - fStart; /* length of field */
|
---|
| 274 |
|
---|
| 275 | strcpy(lnumber,itoal(fLen,4)); /* convert to 4digit str */
|
---|
| 276 | if (!lnumber) return 0;
|
---|
| 277 | strcpy(snumber,itoal(fStart + skip,5)); /* convert start */
|
---|
| 278 | if (!snumber) return 0;
|
---|
| 279 |
|
---|
| 280 | strcpy(direlem[dircntr], ftag); /* start direlem with tag */
|
---|
| 281 | strcat(direlem[dircntr], lnumber); /* append length to dir */
|
---|
| 282 | strcat(direlem[dircntr], snumber); /* append start to dir */
|
---|
| 283 | dircntr++;
|
---|
| 284 |
|
---|
| 285 | return 1;
|
---|
| 286 | }
|
---|
| 287 |
|
---|
| 288 |
|
---|
| 289 |
|
---|
| 290 | /* ------------------------------------------------------------------- */
|
---|
| 291 | /* Main program */
|
---|
| 292 | /* ------------------------------------------------------------------- */
|
---|
| 293 |
|
---|
| 294 | char *MARC2709(char *record, int last, int first, char recstatus,
|
---|
| 295 | char rectype, char biblevel)
|
---|
| 296 | {
|
---|
| 297 | static char buffer[10240], field_data[5120], tag[4], ind[3];
|
---|
| 298 | char alen[3], *cp, *buf = buffer, *cq, logline[128];
|
---|
| 299 | int prelen, ii;
|
---|
| 300 | int lastchar, Last, First, x, more;
|
---|
| 301 | int SOF, digits, newField;
|
---|
| 302 |
|
---|
| 303 | char test[6];
|
---|
| 304 |
|
---|
| 305 | strcpy(buf, record);
|
---|
| 306 |
|
---|
| 307 | Last = First = 0; /* initialize */
|
---|
| 308 | if (last > 0) /* Last : linelength if */
|
---|
| 309 | { /* fixed */
|
---|
| 310 | Last = last; /* First: starting col */
|
---|
| 311 | First = first; /* for cont. line */
|
---|
| 312 | }
|
---|
| 313 |
|
---|
| 314 | prelen = 5;
|
---|
| 315 | dollar = '$';
|
---|
| 316 | strcpy(dollarstring, "$");
|
---|
| 317 |
|
---|
| 318 | data_field[0] = '\0';
|
---|
| 319 | directory[0] = '\0';
|
---|
| 320 | strcpy(field_001, " ");
|
---|
| 321 | strcpy(field_008, " ");
|
---|
| 322 | out_record[0] = '\0';
|
---|
| 323 | dircntr = 0;
|
---|
| 324 | startet = 0;
|
---|
| 325 |
|
---|
| 326 | /* initialize directory with 9 bytes for 001 */
|
---|
| 327 |
|
---|
| 328 | sprintf(directory, "001001000000008004100010", alen, alen);
|
---|
| 329 | skip = SKIP + 10;
|
---|
| 330 |
|
---|
| 331 | more = 1;
|
---|
| 332 | while (more) /* loop until EOR */
|
---|
| 333 | {
|
---|
| 334 | x = 0; /* x counts bytes */
|
---|
| 335 |
|
---|
| 336 | for (cp = buf; *cp && *cp != '\n'; cp++) x++; /* read until LF */
|
---|
| 337 |
|
---|
| 338 | if (!*cp) /* EOR */
|
---|
| 339 | more = 0;
|
---|
| 340 | else
|
---|
| 341 | cp++;
|
---|
| 342 |
|
---|
| 343 | SOF = 0;
|
---|
| 344 |
|
---|
| 345 | if (buf[0] == '^') break; /* "EOR-line" */
|
---|
| 346 | if (buf[0] == '*') /* skip leading * */
|
---|
| 347 | {
|
---|
| 348 | buf++;
|
---|
| 349 | x--;
|
---|
| 350 | SOF = 1;
|
---|
| 351 | }
|
---|
| 352 |
|
---|
| 353 | if (x == 0) continue; /* empty line */
|
---|
| 354 |
|
---|
| 355 | digits = 1; /* test if first 3 */
|
---|
| 356 | for (ii = 0; ii < 3; ii++) /* bytes are digits */
|
---|
| 357 | if (!isdigit(buf[ii]))
|
---|
| 358 | {
|
---|
| 359 | digits = 0;
|
---|
| 360 | break;
|
---|
| 361 | }
|
---|
| 362 |
|
---|
| 363 | newField = 0;
|
---|
| 364 |
|
---|
| 365 | if (SOF)
|
---|
| 366 | {
|
---|
| 367 | if (!digits) continue; /* illegal line */
|
---|
| 368 | else newField = 1;
|
---|
| 369 | }
|
---|
| 370 | else
|
---|
| 371 | if (digits) newField = 1;
|
---|
| 372 |
|
---|
| 373 |
|
---|
| 374 | if (newField) /* start of new field */
|
---|
| 375 | {
|
---|
| 376 | if (!out_field(field_data, tag, ind)) /* output prev. field */
|
---|
| 377 | return NULL;
|
---|
| 378 |
|
---|
| 379 | startet = 1;
|
---|
| 380 | field_data[0] = '\0'; /* reset field buffer */
|
---|
| 381 | strncpy(tag, buf, 3); /* keep MARC tag */
|
---|
| 382 | buf += 3;
|
---|
| 383 | x -=3;
|
---|
| 384 |
|
---|
| 385 | if (strncmp(tag, "00", 2) != 0)
|
---|
| 386 | {
|
---|
| 387 | strncpy(ind, buf, 2); /* keep indicator */
|
---|
| 388 | buf += 2; /* if not control field */
|
---|
| 389 | x -= 2;
|
---|
| 390 | }
|
---|
| 391 |
|
---|
| 392 | strncat(field_data, buf, x); /* keep data */
|
---|
| 393 |
|
---|
| 394 | /* strip trailing blanks */
|
---|
| 395 | while (field_data[strlen(field_data) -1] == ' ')
|
---|
| 396 | {
|
---|
| 397 | field_data[strlen(field_data) -1] = '\0';
|
---|
| 398 | x--;
|
---|
| 399 | }
|
---|
| 400 |
|
---|
| 401 | if (Last && x == (Last - prelen)) /* full line */
|
---|
| 402 | lastchar = 1;
|
---|
| 403 | else
|
---|
| 404 | lastchar = 0;
|
---|
| 405 | }
|
---|
| 406 |
|
---|
| 407 | else /* continuation line */
|
---|
| 408 | {
|
---|
| 409 | if (Last)
|
---|
| 410 | {
|
---|
| 411 | cq = buf + First - 1; /* skip fixed nmbr chars */
|
---|
| 412 | x -= (First - 1);
|
---|
| 413 | if (!lastchar && cq[0] != ' ' /* and insert one blank */
|
---|
| 414 | && cq[0] != dollar)
|
---|
| 415 | strcat(field_data, " "); /* if needed */
|
---|
| 416 | }
|
---|
| 417 | else
|
---|
| 418 | {
|
---|
| 419 | for (cq = buf; *cq == ' '; cq++) x--; /* skip leading blanks */
|
---|
| 420 | strcat(field_data, " "); /* insert one blank */
|
---|
| 421 | }
|
---|
| 422 |
|
---|
| 423 | strncat(field_data, cq, x); /* append data */
|
---|
| 424 | /* strip trail. blanks */
|
---|
| 425 | while (field_data[strlen(field_data) -1] == ' ')
|
---|
| 426 | {
|
---|
| 427 | field_data[strlen(field_data) -1] = '\0';
|
---|
| 428 | x--;
|
---|
| 429 | }
|
---|
| 430 |
|
---|
| 431 | if (Last && x == (Last - 5)) /* full line */
|
---|
| 432 | lastchar = 1;
|
---|
| 433 | else lastchar = 0;
|
---|
| 434 |
|
---|
| 435 | }
|
---|
| 436 |
|
---|
| 437 | while (field_data[strlen(field_data) -1] == ' ')
|
---|
| 438 | field_data[strlen(field_data) - 1] = '\0'; /* rm trailing blanks */
|
---|
| 439 | buf = cp;
|
---|
| 440 | }
|
---|
| 441 |
|
---|
| 442 | if (!out_field(field_data, tag, ind)) /* output last field */
|
---|
| 443 | return NULL;
|
---|
| 444 |
|
---|
| 445 | /* terminate field_001 */
|
---|
| 446 | strcat(field_001, FIELD_TERMINATOR);
|
---|
| 447 |
|
---|
| 448 | field_008[40] = '\0'; /* terminate field_008 */
|
---|
| 449 | strcat(field_008, FIELD_TERMINATOR);
|
---|
| 450 |
|
---|
| 451 | /* sort directory elem. */
|
---|
| 452 | qsort ((void *) direlem, dircntr, sizeof(direlem[0]), cmp);
|
---|
| 453 | for (ii = 0; ii < dircntr; ii++)
|
---|
| 454 | strcat(directory, direlem[ii]); /* append to directory */
|
---|
| 455 |
|
---|
| 456 | strcat(directory, FIELD_TERMINATOR); /* terminate dictionary */
|
---|
| 457 |
|
---|
| 458 | strcat(data_field, RECORD_TERMINATOR); /* terminate data */
|
---|
| 459 |
|
---|
| 460 | x = 24 + strlen(directory); /* construct leader */
|
---|
| 461 |
|
---|
| 462 | strcpy(test, itoal(x,5));
|
---|
| 463 |
|
---|
| 464 | strncpy(ldr.ltab.base_adress, test, 5);
|
---|
| 465 |
|
---|
| 466 | x += (strlen(data_field)
|
---|
| 467 | + strlen(field_001)
|
---|
| 468 | + strlen(field_008));
|
---|
| 469 |
|
---|
| 470 | strcpy(test, itoal(x,5));
|
---|
| 471 |
|
---|
| 472 | strncpy(ldr.ltab.record_length, test, 5);
|
---|
| 473 |
|
---|
| 474 | ldr.ltab.record_status = recstatus;
|
---|
| 475 | ldr.ltab.record_type = rectype;
|
---|
| 476 | ldr.ltab.bibliographic_level = biblevel;
|
---|
| 477 | ldr.ltab.indicator_count = INDICATOR_COUNT;
|
---|
| 478 | ldr.ltab.subfield_code_count = SUBFIELD_CODE_COUNT;
|
---|
| 479 | strncpy(ldr.ltab.unused1,UNUSED,2);
|
---|
| 480 | strncpy(ldr.ltab.unused2,UNUSED,3);
|
---|
| 481 | ldr.ltab.entry1 = LENGTH_OF_LENGTH_OF_FIELD;
|
---|
| 482 | ldr.ltab.entry2 = LENGTH_OF_STARTING_CHARACTER_POSITION;
|
---|
| 483 | ldr.ltab.entry3 = '0';
|
---|
| 484 | ldr.ltab.entry4 = '0';
|
---|
| 485 |
|
---|
| 486 | ldr.ldr_string[24] = '\0';
|
---|
| 487 |
|
---|
| 488 | strcpy(out_record, ldr.ldr_string); /* put together record */
|
---|
| 489 | strcat(out_record, directory);
|
---|
| 490 | strcat(out_record, field_001);
|
---|
| 491 | strcat(out_record, field_008);
|
---|
| 492 | strcat(out_record, data_field);
|
---|
| 493 |
|
---|
| 494 | return out_record;
|
---|
| 495 | }
|
---|