OpenXM/src/ox_toolkit/parse.c - diff

Return to parse.c CVS log

Up to [local] / OpenXM / src / ox_toolkit

Diff for /OpenXM/src/ox_toolkit/parse.c between version 1.1 and 1.14

version 1.1, 1999/12/09 22:44:56

version 1.14, 2003/06/02 10:25:57

Line 1

/* -*- mode: C; coding: euc-japan -*- */

/* $OpenXM$ */

/* $OpenXM: OpenXM/src/ox_toolkit/parse.c,v 1.13 2003/03/30 08:05:23 ohara Exp $ */

/* OX expression, CMO expression パーサ */

This module is a parser for OX/CMO expressions.

Some commnets are written in Japanese by using the EUC-JP coded

character set.

#include <stdio.h>

#include <stdlib.h>

#include <string.h>

#include <sys/param.h>

#include <setjmp.h>

#include "oxtag.h"

#include <ctype.h>

#include "ox.h"

#include "ox_toolkit.h"

#include "parse.h"

/* --- 構文解析部 --- */

/* --- Parser --- */

/* (重要)セマンティックスについての注意.

/* Remarks for semantics.

CMO_LIST, CMO_STRING は、あらかじめ与えられた要素の個数を無視する.

CMO_MONOMIAL32 は無視しない. (つまりおかしいときは構文エラーになる)

/* parse.c, lex.c では, Lisp 表現された CMO 文字列を読み込み,

parse.c では, Lisp 表現された CMO 文字列を読み込み,

バイト列を出力する. 中間表現として、cmo 構造体を利用する.

parse() はトークンの列から cmo 構造体を生成し、そのポインタを返す.

重要なことはパーサ(の各サブルーチン)は

/* 重要なことはパーサ(の各サブルーチン)は

常にトークンをひとつ先読みしていると言うことである.

Line 36 static union{

Line 40 static union{

char *sym;

} yylval;

/* pflag_cmo_addrev がセットされていれば、厳密には CMO expression では

ないもの, 例えば (CMO_STRING, "hello") も CMO に変換される. */

If `pflag_cmo_addrev' sets, then we admit extended CMO expressions.

For example, (CMO_STRING, "hello") is not a real CMO expression

but it is admitted.

static int pflag_cmo_addrev = 1;

static int pflag_cmo_addrev = 1; /* CMO の省略記法を許すか否かのフラグ */

/* definitions of local functions */

static void parse_error(char *s);

/* 関数の宣言 */

static void parse_right_parenthesis();

static int parse_error(char *s);

static void parse_left_parenthesis();

static int parse_lf();

static void parse_comma();

static int parse_right_parenthesis();

static mpz_ptr parse_mpz_integer();

static int parse_left_parenthesis();

static int parse_integer();

static int parse_comma();

static int parse_integer();

static char *parse_string();

static cmo *parse_cmo_null();

static cmo *parse_cmo_int32();

Line 67 static int parse_sm();

Line 73 static int parse_sm();

static ox *parse_ox();

static ox *parse_ox_command();

static ox *parse_ox_data();

static void init_lex(char *s);

static int lex();

static int is_token_cmo(int token)

{

return (token >= MIN_T_CMO && token < MAX_T_CMO) || token == TOKEN(CMO_ERROR2);

Line 85 static int is_token_ox(int token)

Line 94 static int is_token_ox(int token)

static jmp_buf env_parse;

/* 構文解析に失敗したことを意味する. */

/* This is a parsing fault. */

static int parse_error(char *s)

static void parse_error(char *s)

{

fprintf(stderr, "syntax error: %s\n", s);

ox_printf("syntax error: %s\n", s);

longjmp(env_parse, 1);

}

/* この部分は書き換え予定. */

void setflag_parse(int flag)

{

pflag_cmo_addrev = flag;

}

void init_parser(char *s)

{

setflag_parse(PFLAG_ADDREV);

init_lex(s);

}

cmo *parse()

{

cmo *m;

if (setjmp(env_parse) != 0) {

return NULL; /* 構文解析に失敗したら NULL を返す. */

return NULL;

/* This is an error. */

}

do{

token = lex();

}while (token == '\n');

if (token == '(') {

token = lex();

if (is_token_cmo(token)) {

Line 114 cmo *parse()

Line 131 cmo *parse()

}else {

parse_error("invalid symbol.");

}

parse_lf();

return m;

}

return NULL;

}

/* トークンを先読みしない(重要). */

static int parse_lf()

{

if (token != '\n') {

parse_error("no new line.");

}

return 0;

}

static ox *parse_ox()

{

ox *m = NULL;

Line 183 static int parse_sm()

Line 189 static int parse_sm()

return sm_code;

}

/* 正しい入力ならば, parse_cmo を呼ぶ時点で, token には

TOKEN(CMO_xxx), TOKEN(OX_xxx) のいずれかがセットされている. */

static cmo *parse_cmo()

{

cmo *m = NULL;

Line 249 static cmo *parse_cmo()

Line 252 static cmo *parse_cmo()

return m;

}

static int parse_left_parenthesis()

static void parse_left_parenthesis()

{

if (token != '(') {

parse_error("no left parenthesis.");

Line 257 static int parse_left_parenthesis()

Line 260 static int parse_left_parenthesis()

token = lex();

}

static int parse_right_parenthesis()

static void parse_right_parenthesis()

{

if (token != ')') {

parse_error("no right parenthesis.");

Line 265 static int parse_right_parenthesis()

Line 268 static int parse_right_parenthesis()

token = lex();

}

static int parse_comma()

static void parse_comma()

{

if (token != ',') {

parse_error("no comma.");

Line 273 static int parse_comma()

Line 276 static int parse_comma()

token = lex();

}

static mpz_ptr new_mpz_set_str(char *s)

{

mpz_ptr z = MALLOC(sizeof(mpz_t));

mpz_init_set_str(z, s, 10);

return z;

}

static mpz_ptr my_mpz_neg(mpz_ptr src)

{

mpz_ptr z = MALLOC(sizeof(mpz_t));

mpz_init(z);

mpz_neg(z, src);

return z;

}

static mpz_ptr parse_mpz_integer()

{

int sign = 1;

mpz_ptr val;

if (token == '+') {

token = lex();

}else if (token == '-') {

sign = -1;

token = lex();

}

if (token != T_DIGIT) {

parse_error("no integer.");

}

val = new_mpz_set_str(yylval.sym);

if (sign == -1) {

val = my_mpz_neg(val);

}

token = lex();

return val;

}

static int parse_integer()

{

#if 0

return mpz_get_si(parse_mpz_integer());

#else

int sign = 1;

int val;

if (token != T_INTEGER) {

if (token == '+') {

token = lex();

}else if (token == '-') {

sign = -1;

token = lex();

}

if (token != T_DIGIT) {

parse_error("no integer.");

}

val = yylval.d;

val = sign*atoi(yylval.sym);

token = lex();

return val;

#endif

}

static char *parse_string()

Line 303 static cmo *parse_cmo_null()

Line 357 static cmo *parse_cmo_null()

static cmo *parse_cmo_int32()

{

int i;

int z;

parse_comma();

i = parse_integer();

z = parse_integer();

parse_right_parenthesis();

return (cmo *)new_cmo_int32(i);

return (cmo *)new_cmo_int32(z);

}

static cmo *parse_cmo_string()

Line 317 static cmo *parse_cmo_string()

Line 371 static cmo *parse_cmo_string()

char *s;

parse_comma();

if (token == T_INTEGER) {

if (token == T_DIGIT) {

parse_integer();

parse_comma();

}else if (!pflag_cmo_addrev) {

Line 342 static cmo *parse_cmo_mathcap()

Line 396 static cmo *parse_cmo_mathcap()

static cmo *parse_cmo_list()

{

int length=0;

int i=0;

cmo_list *m = new_cmo_list();

cmo *newcmo;

if (token == ',') {

parse_comma();

if (token == T_INTEGER) {

if (token == T_DIGIT) {

parse_integer();

parse_comma();

}else if (!pflag_cmo_addrev) {

Line 360 static cmo *parse_cmo_list()

Line 412 static cmo *parse_cmo_list()

while(token == '(') {

parse_left_parenthesis();

newcmo = parse_cmo();

append_cmo_list(m, newcmo);

list_append(m, newcmo);

if (token != ',') {

break;

}

Line 376 static cmo *parse_cmo_list()

Line 428 static cmo *parse_cmo_list()

static cmo *parse_cmo_monomial32()

{

int size;

int *exps;

int i;

cmo_monomial32 *m;

int tag;

Line 397 static cmo *parse_cmo_monomial32()

Line 448 static cmo *parse_cmo_monomial32()

m->coef = parse_cmo();

tag = m->coef->tag;

/* m->coef は CMO_ZZ 型か CMO_INT32 型でなければならない */

/* semantics:

The tag of m->coef must be CMO_ZZ or CMO_INT32. */

if (tag != CMO_ZZ && tag != CMO_INT32) {

parse_error("invalid cmo.");

}

Line 405 static cmo *parse_cmo_monomial32()

Line 457 static cmo *parse_cmo_monomial32()

return (cmo *)m;

}

/* cmo_zz の内部を直接いじる. */

/* the following function rewrite internal data of mpz/cmo_zz. */

static cmo *parse_cmo_zz()

{

int length;

int i=0;

cmo_zz *m= NULL;

mpz_ptr z;

parse_comma();

length = parse_integer();

z = parse_mpz_integer();

if (token == ',') {

length = mpz_get_si(z);

m = new_cmo_zz_size(length);

length = abs(length);

Line 423 static cmo *parse_cmo_zz()

Line 477 static cmo *parse_cmo_zz()

m->mpz->_mp_d[i] = parse_integer();

}

}else if (pflag_cmo_addrev) {

m = new_cmo_zz_set_si(length);

m = new_cmo_zz_set_mpz(z);

}else {

parse_error("no comma.");

}

Line 452 static cmo *parse_cmo_ring_by_name()

Line 506 static cmo *parse_cmo_ring_by_name()

parse_left_parenthesis();

ob = parse_cmo();

/* ob は CMO_STRING 型でなければならない */

/* The ob has a type of CMO_STRING. */

if (ob->tag != CMO_STRING) {

parse_error("invalid cmo.");

}

Line 462 static cmo *parse_cmo_ring_by_name()

Line 516 static cmo *parse_cmo_ring_by_name()

static cmo *parse_cmo_distributed_polynomial()

{

int length=0;

int i=0;

cmo_distributed_polynomial *m = new_cmo_distributed_polynomial();

cmo *ob;

int tag;

Line 471 static cmo *parse_cmo_distributed_polynomial()

Line 523 static cmo *parse_cmo_distributed_polynomial()

if (token == ',') {

parse_comma();

if (token == T_INTEGER) {

if (token == T_DIGIT) {

parse_integer();

parse_comma();

}else if (!pflag_cmo_addrev) {

Line 481 static cmo *parse_cmo_distributed_polynomial()

Line 533 static cmo *parse_cmo_distributed_polynomial()

parse_left_parenthesis();

m->ringdef = parse_cmo();

tag = m->ringdef->tag;

/* m->ringdef は DringDefinition でなければならない */

/* m->ringdef needs to be a DringDefinition. */

if (tag != CMO_RING_BY_NAME && tag != CMO_DMS_GENERIC

&& tag != CMO_DMS_OF_N_VARIABLES) {

parse_error("invalid cmo.");

Line 495 static cmo *parse_cmo_distributed_polynomial()

Line 547 static cmo *parse_cmo_distributed_polynomial()

if (ob->tag != CMO_MONOMIAL32 && ob->tag != CMO_ZERO) {

parse_error("invalid cmo.");

}

append_cmo_list((cmo_list *)m, ob);

list_append((cmo_list *)m, ob);

if (token != ',') {

break;

}

Line 530 static cmo *parse_cmo_error2()

Line 582 static cmo *parse_cmo_error2()

return (cmo *)new_cmo_error2(ob);

}

/* --- 字句解析部 --- */

/* --- lexical analyzer --- */

/* lexical analyzer で読み飛ばされる文字なら何を初期値にしてもよい */

/* A white space is ignored by lexical analyzer. */

static int c = ' ';

/* 一文字読み込む関数 */

/* getting a character from string. */

static int (*GETC)() = getchar;

static char *mygetc_ptr;

static int mygetc()

int setgetc(int (*foo)())

{

GETC = foo;

return *mygetc_ptr++;

}

int resetgetc()

static void init_lex(char *s)

{

GETC = getchar;

c=' ';

mygetc_ptr=s;

}

#define SIZE_BUFFER 8192

static char buffer[SIZE_BUFFER];

/* 桁溢れの場合の対策はない */

static char *new_string(char *s)

static int lex_digit()

{

int d = 0;

char *t = MALLOC(strlen(s)+1);

do {

strcpy(t, s);

d = 10*d + (c - '0');

return t;

c = GETC();

} while(isdigit(c));

return d;

}

/* no measure for buffer overflow */

static char *lex_digit()

{

static char buff[SIZE_BUFFER];

int i;

for(i=0; i<SIZE_BUFFER-1; i++) {

if(isdigit(c)) {

buff[i] = c;

}else {

buff[i] = '\0';

return new_string(buff);

}

c = mygetc();

}

buff[SIZE_BUFFER-1] = '\0';

return new_string(buff);

}

#define MK_KEY_CMO(x) { #x , x , TOKEN(x) , IS_CMO }

#define MK_KEY_SM(x) { #x , x , TOKEN(SM) , IS_SM }

#define MK_KEY_OX(x) { #x , x , TOKEN(x) , IS_OX }

static symbol symbol_list[] = {

static struct symbol symbol_list[] = {

MK_KEY_CMO(CMO_NULL),

MK_KEY_CMO(CMO_INT32),

MK_KEY_CMO(CMO_DATUM),

Line 596 static symbol symbol_list[] = {

Line 663 static symbol symbol_list[] = {

{NULL, 0, 0, 0} /* a gate keeper */

};

symbol* lookup_by_symbol(char *key)

symbol_t lookup_by_symbol(char *key)

{

symbol *symp;

symbol_t symp;

for(symp = symbol_list; symp->key != NULL; symp++) {

if (strcmp(key, symp->key)==0) {

return symp;

Line 607 symbol* lookup_by_symbol(char *key)

Line 674 symbol* lookup_by_symbol(char *key)

return NULL;

}

symbol* lookup_by_token(int tok)

symbol_t lookup_by_token(int tok)

{

symbol *symp;

symbol_t symp;

for(symp = symbol_list; symp->key != NULL; symp++) {

if (tok == symp->token) {

return symp;

Line 618 symbol* lookup_by_token(int tok)

Line 685 symbol* lookup_by_token(int tok)

return NULL;

}

symbol* lookup_by_tag(int tag)

symbol_t lookup_by_tag(int tag)

{

symbol *symp;

symbol_t symp;

for(symp = symbol_list; symp->key != NULL; symp++) {

if (tag == symp->tag) {

return symp;

Line 629 symbol* lookup_by_tag(int tag)

Line 696 symbol* lookup_by_tag(int tag)

return NULL;

}

symbol* lookup(int i)

symbol_t lookup(int i)

{

return &symbol_list[i];

}

/* バッファあふれした場合の対策をちゃんと考えるべき */

char *get_symbol_by_tag(int tag)

{

symbol_t symp = lookup_by_tag(tag);

return (symp != NULL)? symp->key: NULL;

}

/* no measure for buffer overflow */

static char *lex_quoted_string()

{

int i;

char c0 = ' ';

char *s = NULL;

for (i=0; i<SIZE_BUFFER; i++) {

c = GETC();

c = mygetc();

if(c == '"') {

s = malloc(i+1);

c = mygetc();

buffer[i]='\0';

strcpy(s, buffer);

return new_string(buffer);

c = GETC();

return s;

}else if (c == '\\') {

c0 = c;

c = GETC();

c = mygetc();

if (c != '"') {

buffer[i++] = c0;

}

buffer[i]=c;

}

fprintf(stderr, "buffer overflow!\n");

ox_printf("buffer overflow!\n");

exit(1);

/* return NULL; */

}

static int token_of_symbol(char *key)

{

symbol *symp = lookup_by_symbol(key);

symbol_t symp = lookup_by_symbol(key);

if (symp != NULL) {

yylval.d = symp->tag;

return symp->token;

}

#if DEBUG

ox_printf("lex error:: \"%s\" is unknown symbol.\n", key);

fprintf(stderr, "lex error:: \"%s\" is unknown symbol.\n", key);

#endif

return 0;

}

Line 685 static int lex_symbol()

Line 753 static int lex_symbol()

return token_of_symbol(buffer);

}

buffer[i]=c;

c = GETC();

c = mygetc();

}

fprintf(stderr, "buffer overflow!\n");

ox_printf("buffer overflow!\n");

return 0;

}

/* return する前に一文字先読みしておく. */

/* Remark: prefetching a character before return. */

int lex()

static int lex()

{

int c_dash = 0;

/* 空白をスキップする. */

/* white spaces are ignored. */

while (isspace(c) && c != '\n') {

while (isspace(c)) {

c = GETC();

c = mygetc();

}

switch(c) {

case '(':

case ')':

case ',':

case '\n':

case '+':

case '-':

c_dash = c;

c = ' ';

return c_dash;

case EOF:

c = GETC();

c = mygetc();

return c_dash;

case '"': /* a quoted string! */

yylval.sym = lex_quoted_string();

Line 718 int lex()

Line 787 int lex()

default:

}

if (isalpha(c)) { /* 識別子 */

if (isalpha(c)) {

/* symbols */

return lex_symbol();

}

/* 32bit 整数値 */

/* digit */

if (isdigit(c)){

yylval.d = lex_digit();

yylval.sym = lex_digit();

return T_INTEGER;

return T_DIGIT;

}

if (c == '-') {

c = mygetc();

c = GETC();

while (isspace(c) && c != '\n') {

c = GETC();

}

if (isdigit(c)){

yylval.d = - lex_digit();

return T_INTEGER;

}

return 0;

}

c = GETC();

return 0;

}

/* 一文字読み込む関数 */

static char *mygetc_line;

static int mygetc_counter;

static int mygetc_counter_max;

static int mygetc_nonlf_flag;

int mygetc()

{

int c = '\0';

if (mygetc_nonlf_flag && mygetc_counter <= mygetc_counter_max) {

c = mygetc_line[mygetc_counter++];

if (c == '\0') {

c = '\n';

mygetc_nonlf_flag = 0;

}

return c;

}

int setmode_mygetc(char *s, int len)

{

mygetc_nonlf_flag=1;

mygetc_counter=0;

mygetc_counter_max=len;

mygetc_line=s;

}

int setflag_parse(int flag)

{

pflag_cmo_addrev = flag;

}

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>