/*
$Id: marcomp.c,v 1.2 2003/02/28 14:34:37 adam Exp $
marcomp.c - compiler of MARC statements.
*/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <yaz/yaz-util.h>
#include "marcomp.h"
static mc_token mc_gettoken(mc_context *c);
static void mc_ungettoken(mc_context *c);
static int mc_getval(mc_context *c);
static int mc_getdata(mc_context *c, char *s, int sz);
static void mc_getinterval(mc_context *c, int *start, int *end);
static mc_subfield *mc_mk_subfield(mc_subfield *parent);
static mc_field *mc_mk_field(void);
static struct mc_errmsg
{
mc_errcode code;
const char *msg;
} mc_errmsg[] = {
{EMCOK, "OK"},
{EMCNOMEM, "NO mem"},
{EMCF, "not complete field"},
{EMCSF, "not complete subfield"},
{EMCSFGROUP, "not closed GROUP"},
{EMCSFVAR, "not closed VARIANT"},
{EMCSFINLINE, "not closed IN-LINE"},
{EMCEND, "not correct errno"}
};
mc_errcode mc_errno(mc_context *c)
{
return c->errcode;
}
const char *mc_error(mc_errcode no)
{
if (no >= EMCOK && no<EMCEND)
return mc_errmsg[no].msg;
else
return mc_errmsg[EMCEND].msg;
}
mc_context *mc_mk_context(const char *s)
{
mc_context *p=0;
if (s && strlen(s))
{
p = (mc_context*) xmalloc(sizeof(*p));
if (!p)
return 0;
memset(p, 0, sizeof(*p));
p->errcode = EMCOK;
p->data = s;
p->len = strlen(s);
p->crrtok = NOP;
}
return p;
}
void mc_destroy_context(mc_context *c)
{
if (c) xfree(c);
}
mc_token mc_gettoken(mc_context *c)
{
if (c->offset >= c->len)
return NOP;
switch (*(c->data+c->offset))
{
case '{': c->crrtok = LVARIANT; break;
case '}': c->crrtok = RVARIANT; break;
case '(': c->crrtok = LGROUP; break;
case ')': c->crrtok = RGROUP; break;
case '<': c->crrtok = LINLINE; break;
case '>': c->crrtok = RINLINE; break;
case '$': c->crrtok = SUBFIELD; break;
case '[': c->crrtok = LINTERVAL; break;
case ']': c->crrtok = RINTERVAL; break;
default:
if (isspace(*(c->data+c->offset)) || *(c->data+c->offset) == '\n')
{
c->crrtok = NOP;
}
else
{
c->crrtok = REGULAR;
c->crrval = *(c->data+c->offset);
}
}
#ifdef DEBUG
fprintf(stderr, "gettoken(): offset: %d", c->offset);
if (c->crrtok == REGULAR)
fprintf(stderr, "<%c>", c->crrval);
fprintf(stderr, "\n");
#endif
c->offset++;
return c->crrtok;
}
void mc_ungettoken(mc_context *c)
{
if (c->offset > 0)
c->offset--;
}
int mc_getval(mc_context *c)
{
return c->crrval;
}
int mc_getdata(mc_context *c, char *s, int sz)
{
int i;
for (i=0; i<sz; i++)
{
if (mc_gettoken(c)!=REGULAR)
{
mc_ungettoken(c);
break;
}
s[i] = mc_getval(c);
}
s[i] = '\0';
return i;
}
void mc_getinterval(mc_context *c, int *start, int *end)
{
char buf[6+1];
int start_pos, end_pos;
start_pos = end_pos = -1;
if (mc_gettoken(c) == LINTERVAL)
{
int i;
for (i=0;i<6;i++)
{
mc_token tok = mc_gettoken(c);
if (tok == RINTERVAL || tok == NOP)
break;
buf[i] = mc_getval(c);
}
buf[i] = '\0';
i = sscanf(buf, "%d-%d", &start_pos, &end_pos);
if (i == 1)
end_pos = start_pos;
else if ( i == 0)
{
start_pos = 0;
}
}
*start = start_pos;
*end = end_pos;
}
mc_field *mc_mk_field(void)
{
mc_field *p = (mc_field *)xmalloc(sizeof(*p));
if (p)
{
memset(p, 0, sizeof(*p));
p->name = (char *)xmalloc(SZ_FNAME+1);
*p->name = '\0';
p->ind1 = (char *)xmalloc(SZ_IND+1);
*p->ind1 = '\0';
p->ind2 = (char *)xmalloc(SZ_IND+1);
*p->ind2 = '\0';
p->interval.start = p->interval.end = -1;
}
return p;
}
void mc_destroy_field(mc_field *p)
{
if (!p)
return;
if (p->name) xfree(p->name);
if (p->ind1) xfree(p->ind1);
if (p->ind2) xfree(p->ind2);
if (p->list) mc_destroy_subfields_recursive(p->list);
xfree(p);
}
mc_field *mc_getfield(mc_context *c)
{
mc_field *pf;
pf = mc_mk_field();
if (!pf)
{
c->errcode = EMCNOMEM;
return 0;
}
if (mc_getdata(c, pf->name, SZ_FNAME) == SZ_FNAME)
{
mc_token nexttok = mc_gettoken(c);
mc_ungettoken(c);
if (nexttok == LINTERVAL)
{
mc_getinterval(c, &pf->interval.start, &pf->interval.end);
#ifdef DEBUG
fprintf(stderr, "ineterval (%d)-(%d)\n", pf->interval.start,
pf->interval.end);
#endif
}
if ((mc_getdata(c, pf->ind1, SZ_IND) == SZ_IND) &&
(mc_getdata(c, pf->ind2, SZ_IND) == SZ_IND))
{
pf->list = mc_getsubfields(c, 0);
}
}
else
{
c->errcode = EMCF;
mc_destroy_field(pf);
return 0;
}
return pf;
}
mc_subfield *mc_mk_subfield(mc_subfield *parent)
{
mc_subfield *p = (mc_subfield*)xmalloc(sizeof(*p));
if (p)
{
memset(p, 0, sizeof(*p));
p->which = MC_SF;
p->name = (char *)xmalloc(SZ_SFNAME+1);
*p->name = '\0';
p->prefix = (char *)xmalloc(SZ_PREFIX+1);
*p->prefix = '\0';
p->suffix = (char *)xmalloc(SZ_SUFFIX+1);
*p->suffix = '\0';
p->parent = parent;
p->interval.start = p->interval.end = -1;
}
return p;
}
void mc_destroy_subfield(mc_subfield *p)
{
if (!p)
return;
if (p->which == MC_SFGROUP || p->which == MC_SFVARIANT)
{
if (p->u.child)
mc_destroy_subfields_recursive(p->u.child);
}
else if (p->which == MC_SF)
{
if (p->u.in_line)
mc_destroy_field(p->u.in_line);
}
if (p->name) xfree(p->name);
if (p->prefix) xfree(p->prefix);
if (p->suffix) xfree(p->suffix);
if (p->parent) p->parent->next = p->next;
xfree(p);
}
void mc_destroy_subfields_recursive(mc_subfield *p)
{
if (!p)
return;
mc_destroy_subfields_recursive(p->next);
if (p->which == MC_SFGROUP || p->which == MC_SFVARIANT)
{
if (p->u.child)
mc_destroy_subfields_recursive(p->u.child);
}
else if (p->which == MC_SF)
{
if (p->u.in_line)
mc_destroy_field(p->u.in_line);
}
if (p->name) xfree(p->name);
if (p->prefix) xfree(p->prefix);
if (p->suffix) xfree(p->suffix);
if (p->parent) p->parent->next = 0;
xfree(p);
}
mc_subfield *mc_getsubfields(mc_context *c, mc_subfield *parent)
{
mc_subfield *psf=0;
mc_token tok = mc_gettoken(c);
if (tok == NOP)
return 0;
if (tok == LGROUP)
{
if (!(psf = mc_mk_subfield(parent)))
{
c->errcode = EMCNOMEM;
return 0;
}
psf->which = MC_SFGROUP;
psf->u.child = mc_getsubfields(c, psf);
if (mc_gettoken(c) == RGROUP)
psf->next = mc_getsubfields(c, psf);
else
{
c->errcode = EMCSFGROUP;
mc_destroy_subfield(psf);
return 0;
}
}
else if (tok == LVARIANT)
{
if (!(psf = mc_mk_subfield(parent)))
{
c->errcode = EMCNOMEM;
return 0;
}
psf->which = MC_SFVARIANT;
psf->u.child = mc_getsubfields(c, psf);
if (mc_gettoken(c) == RVARIANT)
psf->next = mc_getsubfields(c, psf);
else
{
c->errcode = EMCSFVAR;
mc_destroy_subfield(psf);
return 0;
}
}
else if (tok == RGROUP || tok == RVARIANT || tok == RINLINE)
{
mc_ungettoken(c);
return 0;
}
else if (tok == REGULAR)
{
if (!(psf = mc_mk_subfield(parent)))
{
c->errcode = EMCNOMEM;
return 0;
}
mc_ungettoken(c);
if((mc_getdata(c, psf->prefix, SZ_PREFIX) == SZ_PREFIX) &&
(mc_gettoken(c) == SUBFIELD) &&
(mc_getdata(c, psf->name, SZ_SFNAME) == SZ_SFNAME))
{
mc_token tok = mc_gettoken(c);
mc_ungettoken(c);
if (tok == LINTERVAL)
{
mc_getinterval(c, &psf->interval.start, &psf->interval.end);
}
else if (tok == LINLINE)
{
mc_gettoken(c);
psf->u.in_line = mc_getfield(c);
if (mc_gettoken(c) != RINLINE)
{
c->errcode = EMCSFINLINE;
mc_destroy_subfield(psf);
return 0;
}
}
if (mc_getdata(c, psf->suffix, SZ_SUFFIX) == SZ_SUFFIX)
{
psf->which = MC_SF;
psf->next = mc_getsubfields(c, psf);
}
else
{
c->errcode = EMCSF;
mc_destroy_subfield(psf);
return 0;
}
}
}
return psf;
}
syntax highlighted by Code2HTML, v. 0.9.1