mirror of https://github.com/yasm/yasm.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
241 lines
5.4 KiB
241 lines
5.4 KiB
#include <stdlib.h> |
|
#include <string.h> |
|
#include "tools/re2c/scanner.h" |
|
#include "tools/re2c/parse.h" |
|
#include "tools/re2c/globals.h" |
|
#include "tools/re2c/parser.h" |
|
|
|
#ifndef MAX |
|
#define MAX(a,b) (((a)>(b))?(a):(b)) |
|
#endif |
|
|
|
#define BSIZE 8192 |
|
|
|
#define YYCTYPE unsigned char |
|
#define YYCURSOR cursor |
|
#define YYLIMIT s->lim |
|
#define YYMARKER s->ptr |
|
#define YYFILL(n) {cursor = fill(s, cursor);} |
|
|
|
#define RETURN(i) {s->cur = cursor; return i;} |
|
|
|
static unsigned char *fill(Scanner*, unsigned char*); |
|
|
|
void |
|
Scanner_init(Scanner *s, FILE *i) |
|
{ |
|
s->in = i; |
|
s->bot = s->tok = s->ptr = s->cur = s->pos = s->lim = s->top = |
|
s->eof = NULL; |
|
s->tchar = s->tline = 0; |
|
s->cline = 1; |
|
} |
|
|
|
static unsigned char * |
|
fill(Scanner *s, unsigned char *cursor) |
|
{ |
|
if(!s->eof){ |
|
unsigned int cnt = s->tok - s->bot; |
|
if(cnt){ |
|
memcpy(s->bot, s->tok, s->lim - s->tok); |
|
s->tok = s->bot; |
|
s->ptr -= cnt; |
|
cursor -= cnt; |
|
s->pos -= cnt; |
|
s->lim -= cnt; |
|
} |
|
if((s->top - s->lim) < BSIZE){ |
|
unsigned char *buf = malloc(((s->lim - s->bot) + BSIZE)); |
|
memcpy(buf, s->tok, s->lim - s->tok); |
|
s->tok = buf; |
|
s->ptr = &buf[s->ptr - s->bot]; |
|
cursor = &buf[cursor - s->bot]; |
|
s->pos = &buf[s->pos - s->bot]; |
|
s->lim = &buf[s->lim - s->bot]; |
|
s->top = &s->lim[BSIZE]; |
|
if (s->bot) |
|
free(s->bot); |
|
s->bot = buf; |
|
} |
|
if((cnt = fread(s->lim, 1, BSIZE, s->in)) != BSIZE){ |
|
s->eof = &s->lim[cnt]; *s->eof++ = '\0'; |
|
} |
|
s->lim += cnt; |
|
} |
|
return cursor; |
|
} |
|
|
|
/*!re2c |
|
zero = "\000"; |
|
any = [\000-\377]; |
|
dot = any \ [\n]; |
|
esc = dot \ [\\]; |
|
istring = "[" "^" ((esc \ [\]]) | "\\" dot)* "]" ; |
|
cstring = "[" ((esc \ [\]]) | "\\" dot)* "]" ; |
|
dstring = "\"" ((esc \ ["] ) | "\\" dot)* "\""; |
|
sstring = "'" ((esc \ ['] ) | "\\" dot)* "'" ; |
|
letter = [a-zA-Z]; |
|
digit = [0-9]; |
|
*/ |
|
|
|
int |
|
Scanner_echo(Scanner *s, FILE *out) |
|
{ |
|
unsigned char *cursor = s->cur; |
|
int ignore_eoc = 0; |
|
|
|
/* Catch EOF */ |
|
if (s->eof && cursor == s->eof) |
|
return 0; |
|
|
|
s->tok = cursor; |
|
echo: |
|
/*!re2c |
|
"/*!re2c" { fwrite(s->tok, 1, &cursor[-7] - s->tok, out); |
|
s->tok = cursor; |
|
RETURN(1); } |
|
"/*!max:re2c" { |
|
fprintf(out, "#define YYMAXFILL %u\n", maxFill); |
|
s->tok = s->pos = cursor; |
|
ignore_eoc = 1; |
|
goto echo; |
|
} |
|
"*" "/" { |
|
if (ignore_eoc) { |
|
ignore_eoc = 0; |
|
} else { |
|
fwrite(s->tok, 1, cursor - s->tok, out); |
|
} |
|
s->tok = s->pos = cursor; |
|
goto echo; |
|
} |
|
"\n" { fwrite(s->tok, 1, cursor - s->tok, out); |
|
s->tok = s->pos = cursor; s->cline++; oline++; |
|
goto echo; } |
|
zero { fwrite(s->tok, 1, cursor - s->tok - 1, out); /* -1 so we don't write out the \0 */ |
|
if(cursor == s->eof) { RETURN(0); } } |
|
any { goto echo; } |
|
*/ |
|
} |
|
|
|
|
|
int |
|
Scanner_scan(Scanner *s) |
|
{ |
|
unsigned char *cursor = s->cur; |
|
unsigned int depth; |
|
|
|
scan: |
|
s->tchar = cursor - s->pos; |
|
s->tline = s->cline; |
|
s->tok = cursor; |
|
/*!re2c |
|
"{" { depth = 1; |
|
goto code; |
|
} |
|
"/*" { depth = 1; |
|
goto comment; } |
|
|
|
"*/" { s->tok = cursor; |
|
RETURN(0); } |
|
|
|
dstring { s->cur = cursor; |
|
yylval.regexp = strToRE(Scanner_token(s)); |
|
return STRING; } |
|
|
|
sstring { s->cur = cursor; |
|
yylval.regexp = strToCaseInsensitiveRE(Scanner_token(s)); |
|
return STRING; } |
|
|
|
"\"" { Scanner_fatal(s, "unterminated string constant (missing \")"); } |
|
"'" { Scanner_fatal(s, "unterminated string constant (missing ')"); } |
|
|
|
istring { s->cur = cursor; |
|
yylval.regexp = invToRE(Scanner_token(s)); |
|
return RANGE; } |
|
|
|
cstring { s->cur = cursor; |
|
yylval.regexp = ranToRE(Scanner_token(s)); |
|
return RANGE; } |
|
|
|
"[" { Scanner_fatal(s, "unterminated range (missing ])"); } |
|
|
|
[()|=;/\\] { RETURN(*s->tok); } |
|
|
|
[*+?] { yylval.op = *s->tok; |
|
RETURN(CLOSE); } |
|
|
|
"{" [0-9]+ "}" { yylval.extop.minsize = atoi((char *)s->tok+1); |
|
yylval.extop.maxsize = atoi((char *)s->tok+1); |
|
RETURN(CLOSESIZE); } |
|
|
|
"{" [0-9]+ "," [0-9]+ "}" { yylval.extop.minsize = atoi((char *)s->tok+1); |
|
yylval.extop.maxsize = MAX(yylval.extop.minsize,atoi(strchr((char *)s->tok, ',')+1)); |
|
RETURN(CLOSESIZE); } |
|
|
|
"{" [0-9]+ ",}" { yylval.extop.minsize = atoi((char *)s->tok+1); |
|
yylval.extop.maxsize = -1; |
|
RETURN(CLOSESIZE); } |
|
|
|
letter (letter|digit)* { SubStr substr; |
|
s->cur = cursor; |
|
substr = Scanner_token(s); |
|
yylval.symbol = Symbol_find(&substr); |
|
return ID; } |
|
|
|
[ \t]+ { goto scan; } |
|
|
|
"\n" { if(cursor == s->eof) RETURN(0); |
|
s->pos = cursor; s->cline++; |
|
goto scan; |
|
} |
|
|
|
"." { s->cur = cursor; |
|
yylval.regexp = mkDot(); |
|
return RANGE; |
|
} |
|
|
|
any { fprintf(stderr, "unexpected character: '%c'\n", *s->tok); |
|
goto scan; |
|
} |
|
*/ |
|
|
|
code: |
|
/*!re2c |
|
"}" { if(--depth == 0){ |
|
s->cur = cursor; |
|
yylval.token = Token_new(Scanner_token(s), s->tline); |
|
return CODE; |
|
} |
|
goto code; } |
|
"{" { ++depth; |
|
goto code; } |
|
"\n" { if(cursor == s->eof) Scanner_fatal(s, "missing '}'"); |
|
s->pos = cursor; s->cline++; |
|
goto code; |
|
} |
|
dstring | sstring | any { goto code; } |
|
*/ |
|
|
|
comment: |
|
/*!re2c |
|
"*/" { if(--depth == 0) |
|
goto scan; |
|
else |
|
goto comment; } |
|
"/*" { ++depth; |
|
goto comment; } |
|
"\n" { if(cursor == s->eof) RETURN(0); |
|
s->tok = s->pos = cursor; s->cline++; |
|
goto comment; |
|
} |
|
any { goto comment; } |
|
*/ |
|
} |
|
|
|
void |
|
Scanner_fatal(Scanner *s, const char *msg) |
|
{ |
|
fprintf(stderr, "line %d, column %d: %s\n", s->tline, s->tchar + 1, msg); |
|
exit(1); |
|
}
|
|
|