/* * (c) copyright 1987 by the Vrije Universiteit, Amsterdam, The Netherlands. * See the copyright notice in the ACK home directory, in the file "Copyright". */ /* $Header$ */ /* IDENTIFIER FIDDLING & SYMBOL TABLE HANDLING */ #include "lint.h" #include #include "debug.h" #include "idfsize.h" #include "botch_free.h" #include "nopp.h" #include "nparams.h" #include #include "arith.h" #include "align.h" #include "LLlex.h" #include "level.h" #include "stack.h" #include "idf.h" #include "label.h" #include "def.h" #include "type.h" #include "proto.h" #include "struct.h" #include "declar.h" #include "decspecs.h" #include "sizes.h" #include "Lpars.h" #include "assert.h" #include "specials.h" /* registration of special identifiers */ int idfsize = IDFSIZE; extern char options[]; extern arith NewLocal(); char sp_occurred[SP_TOTAL+1]; /* indicate occurrence of special id */ struct idf *idf_hashtable[HASHSIZE]; /* All identifiers can in principle be reached through idf_hashtable; idf_hashtable[hc] is the start of a chain of idf's whose tags all hash to hc. Each idf is the start of a chain of def's for that idf, sorted according to level, with the most recent one on top. Any identifier occurring on a level is entered into this list, regardless of the nature of its declaration (variable, selector, structure tag, etc.). */ struct idf * idf_hashed(tg, size, hc) char *tg; int size; /* includes the '\0' character */ int hc; { /* The tag tg with length size and known hash value hc is looked up in the identifier table; if not found, it is entered. A pointer to it is returned. The identifier has already been truncated to idfsize characters. */ register struct idf **hook = &idf_hashtable[hc], *notch; while ((notch = *hook)) { register char *s1 = tg; register char *cp = notch->id_text; register int cmp; while (!(cmp = (*s1 - *cp++))) { if (*s1++ == '\0') { break; } } if (cmp < 0) break; if (cmp == 0) { /* suppose that special identifiers, as "__setjmp", are already inserted */ sp_occurred[notch->id_special] = 1; return notch; } hook = ¬ch->next; } /* a new struct idf must be inserted at the hook */ notch = new_idf(); notch->next = *hook; *hook = notch; /* hooked in */ notch->id_text = Salloc(tg, (unsigned) size); #ifndef NOPP /* notch->id_resmac = 0; */ #endif NOPP return notch; } #ifdef DEBUG hash_stat() { if (options['h']) { register int i; print("Hash table tally:\n"); for (i = 0; i < HASHSIZE; i++) { register struct idf *notch = idf_hashtable[i]; int cnt = 0; while (notch) { cnt++; notch = notch->next; } print("%d %d\n", i, cnt); } print("End hash table tally\n"); } } #endif DEBUG struct idf * str2idf(tg) char tg[]; { /* str2idf() returns an entry in the symbol table for the identifier tg. If necessary, an entry is created. It is used where the text of the identifier is available but its hash value is not; otherwise idf_hashed() is to be used. */ register char *cp = tg; register int hash; register int pos = -1; register int ch; char ntg[IDFSIZE + 1]; register char *ncp = ntg; hash = STARTHASH(); while (++pos < idfsize && (ch = *cp++)) { *ncp++ = ch; hash = ENHASH(hash, ch); } hash = STOPHASH(hash); *ncp++ = '\0'; return idf_hashed(ntg, (int) (ncp - ntg), hash); } struct idf * gen_idf() { /* A new idf is created out of nowhere, to serve as an anonymous name. */ static int name_cnt; char buff[100]; sprint(buff, "#%d in %s, line %u", ++name_cnt, dot.tk_file, dot.tk_line); return str2idf(buff); } int is_anon_idf(idf) struct idf *idf; { return idf->id_text[0] == '#'; } declare_idf(ds, dc, lvl) struct decspecs *ds; struct declarator *dc; { /* The identifier inside dc is declared on the level lvl, with properties deduced from the decspecs ds and the declarator dc. The level is given explicitly to be able to insert, e.g., labels on the outermost level inside the function. This routine implements the rich semantics of C declarations. */ register struct idf *idf = dc->dc_idf; register int sc = ds->ds_sc; /* This local copy is essential: char b(), c; makes b GLOBAL and c AUTO. */ register struct def *def = idf->id_def; /* may be NULL */ register struct type *type; struct stack_level *stl = stack_level_of(lvl); char formal_array = 0; /* determine the present type */ if (ds->ds_type == 0) { /* at the L_FORMAL1 level there is no type specified yet */ ASSERT(lvl == L_FORMAL1); type = int_type; /* may change at L_FORMAL2 */ } else { /* combine the decspecs and the declarator into one type */ type = declare_type(ds->ds_type, dc); if (type->tp_size <= (arith)0 && actual_declaration(sc, type)) { if (type->tp_size == (arith) -1) { /* the type is not yet known, but it has to be: */ extern char *symbol2str(); if (type->tp_fund != VOID) error("unknown %s-type", symbol2str(type->tp_fund)); else error("void is not a complete type"); } else if (type->tp_fund != LABEL) { /* CJ */ strict("%s has size 0", idf->id_text); } } } /* some additional work for formal definitions */ if (lvl == L_FORMAL2) { switch (type->tp_fund) { case FUNCTION: warning("%s is a function; cannot be formal", idf->id_text); type = construct_type(POINTER, type, 0, (arith)0, NO_PROTO); break; case ARRAY: /* 3.7.1 */ type = construct_type(POINTER, type->tp_up, 0, (arith)0, NO_PROTO); formal_array = 1; break; case FLOAT: case CHAR: case SHORT: /* The conversion is done in formal_cvt(). It is * not done when the type is float and there is a * prototype. */ break; } } /* The tests on types, postponed from do_decspecs(), can now be performed. */ /* update the storage class */ if (type && type->tp_fund == FUNCTION) { if (lvl != L_GLOBAL) { /* 3.5.1 */ if (sc == 0) sc = GLOBAL; else if (sc != EXTERN && sc != IMPLICIT) { error("illegal storage class %s for function with block-scope" , symbol2str(sc)); ds->ds_sc = sc = GLOBAL; } } else if (sc == 0) sc = GLOBAL; } else /* non-FUNCTION */ if (sc == 0) sc = lvl == L_GLOBAL ? GLOBAL : lvl == L_FORMAL1 || lvl == L_FORMAL2 ? FORMAL : AUTO; /* is it a universal typedef? */ if (def && def->df_level == L_UNIVERSAL) warning("redeclaring reserved word %s", idf->id_text); #ifdef LINT if ( def && def->df_level < lvl && !( lvl == L_FORMAL2 || def->df_level == L_UNIVERSAL || sc == GLOBAL || sc == EXTERN ) ) { /* there is already a definition for this non-extern name on a more global level */ warning("%s is already defined as a %s", idf->id_text, def->df_level == L_GLOBAL ? "global" : def->df_level == L_FORMAL2 ? "formal" : "more global local" ); } #endif LINT if ((def && ( def->df_level == lvl || ( lvl != L_GLOBAL && def->df_level > lvl ) )) || (lvl == L_GLOBAL && def && def->df_level == L_PROTO && def->next && def->next->df_level == L_GLOBAL) ) { /* There is already a declaration for idf on this level, or even more inside. The rules differ for different levels. */ switch (lvl) { case L_GLOBAL: global_redecl(idf, sc, type); def->df_file = idf->id_file; def->df_line = idf->id_line; break; case L_FORMAL1: /* formal declaration */ error("formal %s redeclared", idf->id_text); break; case L_FORMAL2: /* formal definition */ default: /* local */ error("%s redeclared", idf->id_text); break; } } else /* the idf is unknown on this level */ if (lvl == L_FORMAL2 && sc != ENUM && good_formal(def, idf)) { /* formal declaration, update only */ def->df_type = type; def->df_formal_array = formal_array; def->df_sc = sc; def->df_level = L_FORMAL2; /* CJ */ def->df_file = idf->id_file; def->df_line = idf->id_line; } #if 0 /* be more strict in scope (at least for now) */ else if ( lvl >= L_LOCAL && (type->tp_fund == FUNCTION || sc == EXTERN) ) { /* extern declaration inside function is treated the same way as global extern declaration */ if (sc == STATIC && type->tp_fund == FUNCTION) if (!is_anon_idf(idf)) warning("non-global static function %s", idf->id_text); declare_idf(ds, dc, L_GLOBAL); } #endif else { /* fill in the def block */ register struct def *newdef = new_def(); newdef->next = def; newdef->df_level = lvl; newdef->df_type = type; newdef->df_sc = sc; newdef->df_file = idf->id_file; newdef->df_line = idf->id_line; #ifdef LINT newdef->df_set = (type->tp_fund == ARRAY); /* newdef->df_firstbrace = 0; */ #endif LINT /* link it into the name list in the proper place */ idf->id_def = newdef; update_ahead(idf); stack_idf(idf, stl); /* We now calculate the address. Globals have names and don't get addresses, they get numbers instead (through data_label()). Formals are handled by declare_formals(). So here we hand out local addresses only. */ if (lvl >= L_LOCAL) { ASSERT(sc); switch (sc) { case REGISTER: case AUTO: if (type->tp_size == (arith)-1 && type->tp_fund != ARRAY) { error("size of local %s unknown", idf->id_text); /** type = idf->id_def->df_type = int_type; **/ } newdef->df_address = NewLocal(type->tp_size, type->tp_align, regtype(type), sc); break; case STATIC: newdef->df_address = (arith) data_label(); break; } } } } actual_declaration(sc, tp) int sc; struct type *tp; { /* An actual_declaration needs space, right here and now. */ register int fund = tp->tp_fund; if (sc == ENUM || sc == TYPEDEF) /* virtual declarations */ return 0; if (fund == FUNCTION || fund == ARRAY) /* allocation solved in other ways */ return 0; /* to be allocated */ return 1; } global_redecl(idf, new_sc, tp) register struct idf *idf; struct type *tp; { /* A global identifier may be declared several times, provided the declarations do not conflict; they might conflict in type (or supplement each other in the case of an array) or they might conflict or supplement each other in storage class. */ register struct def *def = idf->id_def; while (def->df_level != L_GLOBAL) def = def->next; if (!equal_type(tp, def->df_type, 0)) { error("redeclaration of %s with different type", idf->id_text); return; } else update_proto(tp, def->df_type); if (tp->tp_fund == ARRAY) { /* Multiple array declaration; this may be interesting */ if (tp->tp_size < 0) { /* new decl has [] */ /* nothing new */ } else if (def->df_type->tp_size < 0) { /* old decl has [] */ def->df_type = tp; } } /* Now we may be able to update the storage class. Clean out this mess as soon as we know all the possibilities for new_sc. For now we have: EXTERN: we have seen the word "extern" GLOBAL: the item was declared on the outer level, without either "extern" or "static". STATIC: we have seen the word "static" IMPLICIT: function declaration inferred from call */ if (new_sc == IMPLICIT) return; /* no new information */ switch (def->df_sc) { /* the old storage class */ case EXTERN: switch (new_sc) { /* the new storage class */ case EXTERN: case GLOBAL: break; case STATIC: warning("redeclaration of %s to static ignored" , idf->id_text); break; default: crash("bad storage class"); /*NOTREACHED*/ } break; case GLOBAL: switch (new_sc) { /* the new storage class */ case EXTERN: def->df_sc = EXTERN; break; case GLOBAL: break; case STATIC: warning("redeclaration of %s to static ignored" , idf->id_text); break; default: crash("bad storage class"); /*NOTREACHED*/ } break; case STATIC: switch (new_sc) { /* the new storage class */ case GLOBAL: warning("%s redeclared extern", idf->id_text); def->df_sc = new_sc; break; case EXTERN: /* complain at definition */ break; case STATIC: break; default: crash("bad storage class"); /*NOTREACHED*/ } break; case IMPLICIT: switch (new_sc) { /* the new storage class */ case EXTERN: case GLOBAL: def->df_sc = new_sc; break; case STATIC: def->df_sc = new_sc; break; default: crash("bad storage class"); /*NOTREACHED*/ } break; case ENUM: case TYPEDEF: error("illegal redeclaration of %s", idf->id_text); break; default: crash("bad storage class"); /*NOTREACHED*/ } } int good_formal(def, idf) register struct def *def; register struct idf *idf; { /* Succeeds if def is a proper L_FORMAL1 definition and gives an error message otherwise. */ if (!def || def->df_level != L_FORMAL1) { /* not in parameter list */ if (!is_anon_idf(idf)) error("%s not in parameter list", idf->id_text); return 0; } ASSERT(def->df_sc == FORMAL); /* CJ */ return 1; } declare_params(dc) struct declarator *dc; { /* Declares the formal parameters if they exist. */ register struct formal *fm = dc->dc_formal; while (fm) { declare_parameter(fm->fm_idf); fm = fm->next; } } init_idf(idf) register struct idf *idf; { /* The topmost definition of idf is set to initialized. */ register struct def *def = idf->id_def; /* the topmost */ while (def->df_level <= L_PROTO) def = def->next; if (def->df_initialized) error("multiple initialization of %s", idf->id_text); if (def->df_sc == TYPEDEF) { warning("typedef cannot be initialized"); def->df_sc = EXTERN; /* ??? *//* What else ? */ } def->df_initialized = 1; } declare_parameter(idf) struct idf *idf; { /* idf is declared as a formal. */ add_def(idf, FORMAL, int_type, level); } declare_enum(tp, idf, l) struct type *tp; struct idf *idf; arith l; { /* idf is declared as an enum constant with value l. */ add_def(idf, ENUM, tp, level); idf->id_def->df_address = l; } check_formals(idf, dc) struct idf *idf; struct declarator *dc; { register struct formal *fm = dc->dc_formal; register struct proto *pl = idf->id_def->df_type->tp_proto; register struct decl_unary *du = dc->dc_decl_unary; if (!du) { /* error or typdef'ed function */ error("illegal definition of %s", idf->id_text); return; } while (du && du->du_fund != FUNCTION) du = du->next; if (!du) return; /* terrible error, signalled earlier */ if (du->du_proto) return; if (pl) { /* Don't give a warning about an old-style definition, * since the arguments will be checked anyway. */ if (pl->pl_flag & PL_ELLIPSIS) { if (!(du->du_proto) && !(pl->pl_flag & PL_ERRGIVEN)) error("ellipsis terminator in previous declaration"); pl = pl->next; } else if (pl->pl_flag & PL_VOID) { pl = pl->next; /* should be 0 */ } while(fm && pl) { if (!equal_type(promoted_type(fm->fm_idf->id_def->df_type) , pl->pl_type, -1)) { if (!(pl->pl_flag & PL_ERRGIVEN)) error("incorrect type for parameter %s" , fm->fm_idf->id_text); pl->pl_flag |= PL_ERRGIVEN; } fm = fm->next; pl = pl->next; } if (pl || fm) { error("incorrect number of parameters"); } } else { /* make a pseudo-prototype */ register struct proto *lpl = new_proto(); if (!options['o']) warning("'%s' old-fashioned function definition" , dc->dc_idf->id_text); while (fm) { if (pl == 0) pl = lpl; else { lpl->next = new_proto(); lpl = lpl->next; } lpl->pl_flag = PL_FORMAL; lpl->pl_idf = fm->fm_idf; lpl->pl_type = promoted_type(fm->fm_idf->id_def->df_type); fm = fm->next; } if (pl == 0) { /* make func(void) */ pl = lpl; pl->pl_type = void_type; pl->pl_flag = PL_FORMAL | PL_VOID; } idf->id_def->df_type->tp_pseudoproto = pl; } free_formals(dc->dc_formal); dc->dc_formal = 0; } declare_formals(idf, fp) struct idf *idf; arith *fp; { /* Declares those formals as int that haven't been declared by the user. An address is assigned to each formal parameter. The total size of the formals is returned in *fp; */ register struct stack_entry *se = stack_level_of(L_FORMAL1)->sl_entry; arith f_offset = (arith)0; register int nparams = 0; int hasproto = idf->id_def->df_type->tp_proto != 0; #ifdef DEBUG if (options['t']) dumpidftab("start declare_formals", 0); #endif DEBUG while (se) { register struct def *def = se->se_idf->id_def; /* this stacklevel may also contain tags. ignore them */ if (!def || def->df_level < L_FORMAL1 ) { se = se->next; continue; } def->df_address = f_offset; /* the alignment convention for parameters is: align on word boundaries, i.e. take care that the following parameter starts on a new word boundary. */ f_offset = align(f_offset + def->df_type->tp_size, (int) word_size); /* cvt int to char or short and double to float, if necessary */ formal_cvt(hasproto, def); se = se->next; def->df_level = L_FORMAL2; /* CJ */ RegisterAccount(def->df_address, def->df_type->tp_size, regtype(def->df_type), def->df_sc); if (nparams++ >= STDC_NPARAMS) strict("number of formal parameters exceeds ANSI limit"); } *fp = f_offset; } int regtype(tp) struct type *tp; { switch(tp->tp_fund) { case INT: case LONG: return reg_any; case FLOAT: case DOUBLE: case LNGDBL: return reg_float; case POINTER: return reg_pointer; } return -1; } add_def(idf, sc, tp, lvl) struct idf *idf; struct type *tp; int lvl; int sc; { /* The identifier idf is declared on level lvl with storage class sc and type tp, through a faked C declaration. This is probably the wrong way to structure the problem, but it will have to do for the time being. */ struct decspecs Ds; struct declarator Dc; Ds = null_decspecs; Ds.ds_type = tp; Ds.ds_sc = sc; Dc = null_declarator; Dc.dc_idf = idf; declare_idf(&Ds, &Dc, lvl); } update_ahead(idf) register struct idf *idf; { /* The tk_symb of the token ahead is updated in the light of new information about the identifier idf. */ register int tk_symb = AHEAD; if ( (tk_symb == IDENTIFIER || tk_symb == TYPE_IDENTIFIER) && ahead.tk_idf == idf ) AHEAD = idf->id_def && idf->id_def->df_sc == TYPEDEF ? TYPE_IDENTIFIER : IDENTIFIER; } free_formals(fm) register struct formal *fm; { while (fm) { struct formal *tmp = fm->next; free_formal(fm); fm = tmp; } }