129 lines
		
	
	
	
		
			2.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			129 lines
		
	
	
	
		
			2.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* L L l e x . c
 | |
|  *
 | |
|  * Very simple lexical analyzer. 
 | |
|  * Also contains LLmessage().
 | |
|  */
 | |
| # include <ctype.h>
 | |
| # include <stdio.h>
 | |
| # include "tunable.h"
 | |
| # include "token.h"
 | |
| # include "Lpars.h"
 | |
| 
 | |
| struct token dot;		/* current token */
 | |
| static struct token aside;	/* to put currrent token aside, when a token
 | |
| 				 * is inserted
 | |
| 				 */
 | |
| int	newline, lineno;	/* To keep track of linenumbers */
 | |
| extern FILE *input;		/* file descriptor of machine table */
 | |
| 
 | |
| LLlex() {
 | |
| 	register c;
 | |
| 
 | |
| 	if (aside.t_tokno) {	/* A token was pushed aside, return it now */
 | |
| 		dot = aside;
 | |
| 		aside.t_tokno = 0;
 | |
| 		return dot.t_tokno;
 | |
| 	}
 | |
| 	if (newline) {		/* delayed increment of lineno, needed to give
 | |
| 				 * correct line numbers in error messages
 | |
| 				 */
 | |
| 	    	lineno++;
 | |
| 		newline = 0;
 | |
| 	}
 | |
| 	c = getc(input);
 | |
| 	while (c == '/') {	/* Could be a comment */
 | |
| 		if ((c = getc(input)) == '*') {
 | |
| 		    		/* Yes, it is a comment */
 | |
| 			int l;
 | |
| 
 | |
| 			l = lineno;
 | |
|         		do {
 | |
| 			    do {
 | |
| 				if (c == '\n') lineno++;
 | |
| 				c = getc(input);
 | |
| 			    } while (c != '*' && c != EOF);
 | |
|                             if (c != EOF) c = getc(input);
 | |
|                         } while (c != '/' && c != EOF);
 | |
| 			if (c == EOF) {
 | |
| 			    c = lineno;
 | |
| 			    lineno = l;
 | |
| 			    error("Unterminated comment");
 | |
| 			    lineno = c;
 | |
| 			    c = EOF;
 | |
| 			}
 | |
| 			else c = getc(input);
 | |
|                 }
 | |
| 		else {
 | |
| 			ungetc(c, input);
 | |
| 			c = '/';
 | |
| 			break;
 | |
| 		}
 | |
| 	}
 | |
| 	dot.t_tokno = c;
 | |
| 	dot.t_attrib = c;
 | |
| 	if (isupper(c) || islower(c) || c == '_') {
 | |
| 		dot.t_tokno = LETTER;
 | |
| 		return LETTER;
 | |
| 	}
 | |
| 	if (isdigit(c)) {
 | |
| 		dot.t_tokno = DIGIT;
 | |
| 		return DIGIT;
 | |
| 	}
 | |
| 	switch(c) {
 | |
| 	  case line_term :
 | |
| 		dot.t_tokno = LINE_TERMINATOR;
 | |
| 		return LINE_TERMINATOR;
 | |
| 	  case operand_sep :
 | |
| 		dot.t_tokno = OPERAND_SEPARATOR;
 | |
| 		return OPERAND_SEPARATOR;
 | |
| 	  case instruction_sep :
 | |
| 		dot.t_tokno = INSTRUCTION_SEPARATOR;
 | |
| 		return INSTRUCTION_SEPARATOR;
 | |
| 	  case '-' :
 | |
| 		c = getc(input);
 | |
| 		if (c == '>') {
 | |
| 			dot.t_tokno = PATTERN_SEPARATOR;
 | |
| 			return PATTERN_SEPARATOR;
 | |
| 		}
 | |
| 		ungetc(c,input);
 | |
| 		dot.t_tokno = OTHER;
 | |
| 		return OTHER;
 | |
| 	  case open_bracket :
 | |
| 	  	dot.t_tokno = OPEN_BRACKET;
 | |
| 		return OPEN_BRACKET;
 | |
| 	  case close_bracket :
 | |
| 		dot.t_tokno = CLOSE_BRACKET;
 | |
| 		return CLOSE_BRACKET;
 | |
| 	  case '\n' :
 | |
| 		newline = 1;
 | |
| 		/* Fall through */
 | |
| 	  case ' ' :
 | |
| 	  case '\t' :
 | |
| 		dot.t_tokno = SPACE;
 | |
| 		return SPACE;
 | |
| 	  case '%' :
 | |
| 	  case EOF :
 | |
| 		return c;
 | |
| 	  default :
 | |
| 		/* Let the C-compiler find out what is illegal! */
 | |
| 		dot.t_tokno = OTHER;
 | |
| 		return OTHER;
 | |
| 	}
 | |
| }
 | |
| 
 | |
| LLmessage(d) {
 | |
|     static int savlineno;
 | |
|     
 | |
|     if (savlineno != lineno) {
 | |
| 	/* Only an error message if on another line number */
 | |
| 	savlineno = lineno;
 | |
| 	error("Syntax error");
 | |
|     }
 | |
|     if (d > 0) {
 | |
| 	/* "d" is the token to be inserted.
 | |
| 	 * This is the place to put the current token aside and
 | |
| 	 * give the inserted token an attribute ... but who cares
 | |
| 	 */
 | |
| 	aside = dot;
 | |
|     }
 | |
| }
 |