shithub: scc

ref: 08b0f2a554d8e1d8b651ae0d25947104604e5df9
dir: /lex.c/

View raw version

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>

#include "cc.h"
#include "tokens.h"
#include "symbol.h"
#include "types.h"


static FILE *yyin;
union yyval yyval;
static unsigned char aheadtok = NOTOK;
unsigned char yytoken;
unsigned char yyhash;
char yytext[TOKSIZ_MAX + 1];
unsigned linenum;
unsigned columnum;
const char *filename;


static char number(void)
{
	register char *bp;
	register char ch;
	register struct symbol *sym;

	for (bp = yytext; bp < yytext + TOKSIZ_MAX; *bp++ = ch) {
		if (!isdigit(ch = getc(yyin)))
			break;
	}
	if (bp == yytext + TOKSIZ_MAX)
		error("identifier too long %s", yytext);
	*bp = '\0';
	ungetc(ch, yyin);
	yyval.sym = sym = install(NULL, 0);
	sym->val = atoi(yytext);

	return CONSTANT;
}

static unsigned char iden(void)
{
	register char ch;
	register char *bp = yytext;
	register struct symbol *sym;

	for (yyhash = 0; bp < yytext + TOKSIZ_MAX; *bp++ = ch) {
		if (!isalnum(ch = getc(yyin)) && ch != '_')
			break;
		yyhash += ch;
	}
	if (bp == yytext + TOKSIZ_MAX)
		error("identifier too long %s", yytext);
	*bp = '\0';
	ungetc(ch, yyin);
	if ((sym = lookup(yytext, yyhash)) && sym->ns == NS_KEYWORD)
		return sym->tok;
	yyval.sym = sym;
	return IDEN;
}

static unsigned char skip(void)
{
	register int c;
	extern char parser_out_home;

	while (isspace(c = getc(yyin))) {
		if (c == '\n')
			++linenum, columnum = 1;
		else
			++columnum;
	}
	if (c == EOF) {
		if (parser_out_home)
			error("Find EOF while parsing");
		return 0;
	}
	ungetc(c, yyin);
	return 1;
}

static unsigned char
follow(unsigned char op, unsigned char eq, unsigned char rep)
{
	register char c;

	if ((c = getc(yyin)) == '=')
		return eq;
	else if (c == op && rep)
		return rep;
	ungetc(c, yyin);
	return op;
}

static unsigned char rel_shift(unsigned char op)
{
	static char tokens[2][3] = {
		{GE, SHL, SHL_EQ},
		{LE, SHR, SHR_EQ}};
	register char c;
	register char *tp = tokens[op == '>'];

	if ((c = getc(yyin)) == '=') {
		return tp[0];
	} else if (c == op) {
		if ((c = getc(yyin)) == '=')
			return tp[2];
		op = tp[1];
	}
	ungetc(c, yyin);
	return c;
}

static unsigned char minus(void)
{
	register int c;

	switch (c = getc(yyin)) {
	case '-': return DEC;
	case '>': return PTR;
	case '=': return SUB_EQ;
	default:
		ungetc(c, yyin);
		return '-';
	}
}

void next(void)
{
	register unsigned char c;

	if (aheadtok != NOTOK) {
		yytoken = aheadtok;
		aheadtok = NOTOK;
	} else if (!skip()) {
		yytoken = EOFTOK;
	} else if (isalpha(c = getc(yyin)) || c == '_') {
		ungetc(c, yyin);
		yytoken = iden();
	} else if (isdigit(c)) {
		ungetc(c, yyin);
		yytoken = number();
	} else {
		switch (c) {
		case '=': yytoken = follow('=', EQ, 0); break;
		case '^': yytoken = follow('^', XOR_EQ, 0); break;
		case '*': yytoken = follow('*', MUL_EQ, 0); break;
		case '!': yytoken = follow('!', NE, 0); break;
		case '+': yytoken = follow('+', ADD_EQ, INC); break;
		case '&': yytoken = follow('&', AND_EQ, AND); break;
		case '|': yytoken = follow('|', OR_EQ, OR); break;
		case '<': yytoken = rel_shift('<'); break;
		case '>': yytoken = rel_shift('>'); break;
		case '-': yytoken = minus(); break;
		default: yytoken = c;
		}
	}
}

unsigned char ahead(void)
{
	static unsigned char oldtok;

	oldtok = yytoken;
	next();
	aheadtok = yytoken;
	yytoken = oldtok;
	return aheadtok;
}

char accept(register unsigned char tok)
{
	if (yytoken == tok) {
		next();
		return 1;
	}
	return 0;
}

void expect(register unsigned char tok)
{
	if (yytoken != tok)
		error("unexpected %s", yytext);
	next();
}

void open_file(register const char *file)
{
	if (yyin != NULL)
		fclose(yyin);
	if (file == NULL) {
		yyin = stdin;
		filename = "(stdin)";
		return;
	}
	if ((yyin = fopen(file, "r")) == NULL)
		die("file '%s' not found", file);
	filename = file;
	columnum = linenum = 1;
}