+void Assemble(void)
+{
+ int state; // Keyword machine state (output)
+ int j; // Random int, must be fast
+ char * p; // Random char ptr, must be fast
+ TOKEN * tk; // First token in line
+ char * label; // Symbol (or NULL)
+ char * equate; // Symbol (or NULL)
+ int labtyp = 0; // Label type (':', DCOLON)
+ int equtyp = 0; // Equ type ('=', DEQUALS)
+ uint64_t eval; // Expression value
+ WORD eattr; // Expression attributes
+ SYM * esym; // External symbol involved in expr.
+ WORD siz = 0; // Size suffix to mnem/diretve/macro
+ LONG amsk0, amsk1; // Address-type masks for ea0, ea1
+ MNTAB * m; // Code generation table pointer
+ SYM * sy, * sy2; // Symbol (temp usage)
+ char * opname = NULL; // Name of dirctve/mnemonic/macro
+ int listflag; // 0: Don't call listeol()
+ WORD rmask; // Register list, for REG
+ int equreg; // RISC register
+ listflag = 0; // Initialise listing flag
+
+loop: // Line processing loop label
+
+ // Get another line of tokens
+ if (TokenizeLine() == TKEOF)
+ {
+DEBUG { printf("Assemble: Found TKEOF flag...\n"); }
+ if (list_flag && listflag) // Flush last line of source
+ listeol();
+
+ if (ifent->if_prev != NULL) // Check conditional token
+ error("hit EOF without finding matching .endif");
+
+ return;
+ }
+
+ DEBUG { DumpTokenBuffer(); }
+
+ if (list_flag)
+ {
+ if (listflag && listing > 0)
+ listeol(); // Tell listing generator about EOL
+
+ lstout((char)(disabled ? '-' : lntag)); // Prepare new line for listing
+ listflag = 1; // OK to call `listeol' now
+ just_bss = 0; // Reset just_bss mode
+ }
+
+ state = -3; // No keyword (just EOL)
+ label = NULL; // No label
+ label_defined = NULL; // No label defined yet
+ lab_sym = NULL; // No (exported) label
+ equate = NULL; // No equate
+ tk = tok; // Save first token in line
+ pcloc = (uint32_t)sloc; // Set beginning-of-line PC
+
+loop1: // Internal line processing loop
+
+ if (*tok == EOL) // Restart loop if end-of-line
+ goto loop;
+
+ // First token MUST be a symbol (Shamus: not sure why :-/)
+ if (*tok != SYMBOL)
+ {
+ error("syntax error; expected symbol");
+
+ goto loop;
+ }
+
+ j = (int)tok[2]; // Skip equates (normal statements)
+
+ if (j == '=' || j == DEQUALS || j == SET || j == REG || j == EQUREG || j == CCDEF)
+ {
+ equate = string[tok[1]];
+ equtyp = j;
+ tok += 3;
+ goto normal;
+ }
+
+ // Skip past label (but record it)
+ if (j == ':' || j == DCOLON)
+ {
+ label = string[tok[1]]; // Get label name
+ labtyp = tok[2]; // Get label type
+ tok += 3; // Go to next line token
+ }
+
+ // EOL is legal here...
+ if (*tok == EOL)
+ goto normal;
+
+ // First token MUST be a symbol (if we get here, tok didn't advance)
+ if (*tok++ != SYMBOL)
+ {
+ error("syntax error; expected symbol");
+ goto loop;
+ }
+
+ opname = p = string[*tok++];
+
+ // Check to see if the SYMBOL is a keyword (a mnemonic or directive).
+ // On output, `state' will have one of the values:
+ // -3 there was no symbol (EOL)
+ // -2..-1 the symbol didn't match any keyword
+ // 0..499 vanilla directives (dc, ds, etc.)
+ // 500..999 electric directives (macro, rept, etc.)
+ // 1000..+ mnemonics (move, lsr, etc.)
+ for(state=0; state>=0;)
+ {
+ j = mnbase[state] + (int)tolowertab[*p];
+
+ // Reject, character doesn't match
+ if (mncheck[j] != state)
+ {
+ state = -1; // No match
+ break;
+ }
+
+ // Must accept or reject at EOS
+ if (!*++p)
+ {
+ state = mnaccept[j]; // (-1 on no terminal match)
+ break;
+ }
+
+ state = mntab[j];
+ }
+
+ // Check for ".b" ".w" ".l" after directive, macro or mnemonic.
+ siz = SIZN;
+
+ switch (*tok)
+ {
+ case DOTW: siz = SIZW, tok++; break;
+ case DOTL: siz = SIZL, tok++; break;
+ case DOTB: siz = SIZB, tok++; break;
+ case DOTD: siz = SIZD, tok++; break;
+ case DOTP: siz = SIZP, tok++; break;
+ case DOTQ: siz = SIZQ, tok++; break;
+ case DOTS: siz = SIZS, tok++; break;
+ case DOTX: siz = SIZX, tok++; break;
+ }
+
+ // Do special directives (500..999) (These must be handled in "real time")
+ if (state >= 500 && state < 1000)
+ {
+ switch (state)
+ {
+ case MN_IF:
+ d_if();
+ goto loop;
+
+ case MN_ELSE:
+ d_else();
+ goto loop;
+
+ case MN_ENDIF:
+ d_endif();
+ goto loop;
+
+ case MN_IIF: // .iif --- immediate if
+ if (disabled || expr(exprbuf, &eval, &eattr, &esym) != OK)
+ goto loop;
+
+ if (!(eattr & DEFINED))
+ {
+ error(undef_error);
+ goto loop;
+ }
+
+ if (*tok++ != ',')
+ {
+ error(comma_error);
+ goto loop;
+ }
+
+ if (eval == 0)
+ goto loop;
+
+ goto loop1;
+
+ case MN_MACRO: // .macro --- macro definition
+ if (!disabled)
+ {
+ // Label on a macro definition is bad mojo... Warn the user
+ if (label != NULL)
+ warn(lab_ignored);
+
+ DefineMacro();
+ }
+
+ goto loop;
+
+ case MN_EXITM: // .exitm --- exit macro
+ case MN_ENDM: // .endm --- same as .exitm
+ if (!disabled)
+ {
+ if (label != NULL)
+ warn(lab_ignored);
+
+ ExitMacro();
+ }
+
+ goto loop;
+
+ case MN_REPT:
+ if (!disabled)
+ {
+ // Handle labels on REPT directive lines...
+ if (label)
+ {
+ if (HandleLabel(label, labtyp) != 0)
+ goto loop;
+
+ label_defined = label;
+ }
+
+ HandleRept();
+ }
+
+ goto loop;
+
+ case MN_ENDR:
+ if (!disabled)
+ error("mis-nested .endr");
+
+ goto loop;
+ }
+ }
+
+normal:
+ if (disabled) // Conditionally disabled code
+ goto loop;
+
+ // Do equates
+ if (equate != NULL)
+ {
+ // Pick global or local symbol enviroment
+ j = (*equate == '.' ? curenv : 0);
+ sy = lookup(equate, LABEL, j);
+
+ if (sy == NULL)
+ {
+ sy = NewSymbol(equate, LABEL, j);
+ sy->sattr = 0;
+
+ if (equtyp == DEQUALS)
+ {
+ // Can't GLOBAL a local symbol
+ if (j)
+ {
+ error(locgl_error);
+ goto loop;
+ }
+
+ sy->sattr = GLOBAL;
+ }
+ }
+ else if ((sy->sattr & DEFINED) && equtyp != SET)
+ {
+ if ((equtyp == EQUREG) && (sy->sattre & UNDEF_EQUR))
+ {
+ sy->sattre &= ~UNDEF_EQUR;
+ sy->svalue = 0;
+ }
+ else if ((equtyp == CCDEF) && (sy->sattre & UNDEF_CC))
+ {
+ sy->sattre &= ~UNDEF_CC;
+ sy->svalue = 0;
+ }
+ else
+ {
+ error("multiple equate to '%s'", sy->sname);
+ goto loop;
+ }
+ }
+
+ // Put symbol in "order of definition" list if it's not already there
+ AddToSymbolDeclarationList(sy);
+
+ // Parse value to equate symbol to;
+ // o .equr
+ // o .reg
+ // o everything else
+ if (equtyp == EQUREG)
+ {
+//Linko's request to issue a warning on labels that equated to the same
+//register would go here. Not sure how to implement it though. :-/
+/*
+Maybe like this way:
+have an array of bools with 64 entries. Whenever a register is equated, set the
+corresponding register bool to true. Whenever it's undef'ed, set it to false.
+When checking to see if it's already been equated, issue a warning.
+*/
+
+ // Check for register to equate to
+ // This check will change once we split the registers per architecture into their own tables
+ // and out of kw.tab. But for now it'll do...
+ if ((*tok >= REG68_D0) && (*tok <= REG56_BA))
+ {
+ sy->sattre = EQUATEDREG; // Mark as equated register
+ equreg = *tok;
+ // Check for ",<bank #>" override notation and skip past it.
+ // It is ignored now. Was that ever useful anyway?
+ if ((rgpu ||rdsp) && (tok[1] == ',') && (tok[2] == CONST))
+ {
+ // Advance token pointer and skip everything
+ tok += 4;
+ }
+
+ eattr = ABS | DEFINED | GLOBAL;
+ eval = equreg;
+ tok++;
+ }
+ // Checking for a register symbol
+ else if (tok[0] == SYMBOL)
+ {
+ sy2 = lookup(string[tok[1]], LABEL, j);
+
+ // Make sure symbol is a valid equreg
+ if (!sy2 || !(sy2->sattre & EQUATEDREG))
+ {
+ error("invalid .equr/.regequ definition");
+ goto loop;
+ }
+ else
+ {
+ eattr = ABS | DEFINED | GLOBAL; // Copy symbol's attributes
+ sy->sattre = sy2->sattre;
+ eval = (sy2->svalue & 0xFFFFF0FF);
+ tok += 2;
+ }
+ }
+ else
+ {
+ error("invalid .equr/.regequ definition");
+ goto loop;
+ }
+ }
+ else if (equtyp == REG)
+ {
+ if (reglist(&rmask) < 0)
+ goto loop;
+
+ eval = (uint32_t)rmask;
+ eattr = ABS | DEFINED;
+ }
+ else if (equtyp == CCDEF)
+ {
+ sy->sattre |= EQUATEDCC;
+ eattr = ABS | DEFINED | GLOBAL;
+
+ if (tok[0] == SYMBOL)
+ {
+ sy2 = lookup(string[tok[1]], LABEL, j);
+
+ if (!sy2 || !(sy2->sattre & EQUATEDCC))
+ {
+ error("invalid gpu/dsp .ccdef definition");
+ goto loop;
+ }
+ else
+ {
+ eattr = ABS | DEFINED | GLOBAL;
+ sy->sattre = sy2->sattre;
+ eval = sy2->svalue;
+ tok += 2;
+ }
+ }
+ else if (expr(exprbuf, &eval, &eattr, &esym) != OK)
+ goto loop;
+ }
+ // equ an equr
+ else if (*tok == SYMBOL)
+ {
+ sy2 = lookup(string[tok[1]], LABEL, j);
+
+ if (sy2 && (sy2->sattre & EQUATEDREG))
+ {
+ sy->stype = sy2->stype;
+ sy->sattr = sy2->sattr;
+ sy->sattre = sy2->sattre;
+ sy->svalue = sy2->svalue;
+ goto loop;
+ }
+ else if (expr(exprbuf, &eval, &eattr, &esym) != OK)
+ goto loop;
+ }
+ else if (expr(exprbuf, &eval, &eattr, &esym) != OK)
+ goto loop;
+
+ if (!(eattr & DEFINED))
+ {
+ error(undef_error);
+ goto loop;
+ }
+
+ sy->sattr |= eattr | EQUATED; // Symbol inherits value and attributes
+ sy->svalue = eval;
+
+ if (list_flag) // Put value in listing
+ listvalue((uint32_t)eval);
+
+ ErrorIfNotAtEOL(); // Must be at EOL now
+ goto loop;
+ }
+
+ // Do labels
+ if (label != NULL)
+ {
+ // Non-zero == error occurred
+ if (HandleLabel(label, labtyp) != 0)
+ goto loop;
+
+ label_defined = label;
+ }
+
+ // Punt on EOL
+ if (state == -3)
+ goto loop;
+
+ // If we're in 6502 mode and are still in need of a mnemonic, then search
+ // for valid 6502 mnemonic.
+ if (m6502 && (state < 0 || state >= 1000))
+ {
+#ifdef ST
+ state = kmatch(opname, mpbase, mpcheck, mptab, mpaccept);
+#else
+ for(state=0, p=opname; state>= 0; )
+ {
+ j = mpbase[state] + tolowertab[*p];
+
+ if (mpcheck[j] != state) // Reject, character doesn't match
+ {
+ state = -1; // No match
+ break;
+ }
+
+ if (!*++p)
+ { // Must accept or reject at EOS
+ state = mpaccept[j]; // (-1 on no terminal match)
+ break;
+ }
+
+ state = mptab[j];
+ }
+#endif
+
+ // Call 6502 code generator if we found a mnemonic
+ if (state >= 2000)
+ {
+ m6502cg(state - 2000);
+ goto loop;
+ }
+ }
+
+ // If we are in GPU or DSP mode and still in need of a mnemonic then search
+ // for one
+ if ((rgpu || rdsp) && (state < 0 || state >= 1000))
+ {
+ for(state=0, p=opname; state>=0;)
+ {
+ j = mrbase[state] + (int)tolowertab[*p];
+
+ // Reject, character doesn't match
+ if (mrcheck[j] != state)
+ {
+ state = -1; // No match
+ break;
+ }
+
+ // Must accept or reject at EOS
+ if (!*++p)
+ {
+ state = mraccept[j]; // (-1 on no terminal match)
+ break;
+ }
+
+ state = mrtab[j];
+ }
+
+ // Call RISC code generator if we found a mnemonic
+ if (state >= 3000)
+ {
+ GenerateRISCCode(state);
+ goto loop;
+ }
+ }
+
+ // If we are in OP mode and still in need of a mnemonic then search for one
+ if (robjproc && ((state < 0) || (state >= 1000)))
+ {
+ for(state=0, p=opname; state>=0;)
+ {
+ j = mobase[state] + (int)tolowertab[*p];
+
+ // Reject, character doesn't match
+ if (mocheck[j] != state)
+ {
+ state = -1; // No match
+ break;
+ }
+
+ // Must accept or reject at EOS
+ if (!*++p)
+ {
+ state = moaccept[j]; // (-1 on no terminal match)
+ break;
+ }
+
+ state = motab[j];
+ }
+
+ // Call OP code generator if we found a mnemonic
+ if (state >= 3100)
+ {
+ GenerateOPCode(state);
+ goto loop;
+ }
+ }
+
+ // If we are in 56K mode and still in need of a mnemonic then search for one
+ if (dsp56001 && ((state < 0) || (state >= 1000)))
+ {
+ for(state=0, p=opname; state>=0;)
+ {
+ j = dspbase[state] + (int)tolowertab[*p];
+
+ // Reject, character doesn't match
+ if (dspcheck[j] != state)
+ {
+ state = -1; // No match
+ break;
+ }
+
+ // Must accept or reject at EOS
+ if (!*++p)
+ {
+ state = dspaccept[j]; // (-1 on no terminal match)
+ break;
+ }
+
+ state = dsptab[j];
+ }
+
+ // Call DSP code generator if we found a mnemonic
+ if (state >= 2000)
+ {
+ LONG parcode;
+ int operands;
+ MNTABDSP * md = &dsp56k_machtab[state - 2000];
+ deposit_extra_ea = 0; // Assume no extra word needed
+
+ if (md->mnfunc == dsp_mult)
+ {
+ // Special case for multiplication instructions: they require
+ // 3 operands
+ if ((operands = dsp_amode(3)) == ERROR)
+ goto loop;
+ }
+ else if ((md->mnattr & PARMOVE) && md->mn0 != M_AM_NONE)
+ {
+ if (dsp_amode(2) == ERROR)
+ goto loop;
+ }
+ else if ((md->mnattr & PARMOVE) && md->mn0 == M_AM_NONE)
+ {
+ // Instructions that have parallel moves but use no operands
+ // (probably only move). In this case, don't parse addressing
+ // modes--just go straight to parallel parse
+ dsp_am0 = dsp_am1 = M_AM_NONE;
+ }
+ else
+ {
+ // Non parallel move instructions can have up to 4 parameters
+ // (well, only tcc instructions really)
+ if ((operands = dsp_amode(4)) == ERROR)
+ goto loop;
+
+ if (operands == 4)
+ {
+ dsp_tcc4(md->mninst);
+ goto loop;
+ }
+ }
+
+ if (md->mnattr & PARMOVE)
+ {
+ // Check for parallel moves
+ if ((parcode = parmoves(dsp_a1reg)) == ERROR)
+ goto loop;
+ }
+ else
+ {
+ if (*tok != EOL)
+ error("parallel moves not allowed with this instruction");
+
+ parcode = 0;
+ }
+
+ while ((dsp_am0 & md->mn0) == 0 || (dsp_am1 & md->mn1) == 0)
+ md = &dsp56k_machtab[md->mncont];
+
+ GENLINENOSYM();
+ (*md->mnfunc)(md->mninst | (parcode << 8));
+ goto loop;
+ }
+ }
+
+ // Invoke macro or complain about bad mnemonic
+ if (state < 0)
+ {
+ if ((sy = lookup(opname, MACRO, 0)) != NULL)
+ InvokeMacro(sy, siz);
+ else
+ error("unknown op '%s'", opname);
+
+ goto loop;
+ }
+
+ // Call directive handlers
+ if (state < 500)
+ {
+ (*dirtab[state])(siz);
+ goto loop;
+ }
+
+ // Do mnemonics
+ // o can't deposit instrs in BSS or ABS
+ // o do automatic .EVEN for instrs
+ // o allocate space for largest possible instr
+ // o can't do ".b" operations with an address register
+ if (scattr & SBSS)
+ {
+ error("cannot initialize non-storage (BSS) section");
+ goto loop;
+ }
+
+ if (sloc & 1) // Automatic .even
+ auto_even();
+
+ if (challoc - ch_size < 18) // Make sure have space in current chunk
+ chcheck(0);
+
+ m = &machtab[state - 1000];
+
+ // Call special-mode handler
+ if (m->mnattr & CGSPECIAL)
+ {
+ GENLINENOSYM();
+ (*m->mnfunc)(m->mninst, siz);
+ goto loop;
+ }
+
+ if (amode(1) < 0) // Parse 0, 1 or 2 addr modes
+ goto loop;
+
+ // Check that we're at EOL
+ // The only exception is ptestr/ptestw instructions
+ // that have 3 or 4 operands and are not handled by
+ // amode(). (yes, we're taking a performance hit here sadly)
+ if (m->mnfunc != m_ptestr && m->mnfunc != m_ptestw)
+ if (*tok != EOL)
+ error(extra_stuff);
+
+ amsk0 = amsktab[am0];
+ amsk1 = amsktab[am1];
+
+ // Catch attempts to use ".B" with an address register (yes, this check
+ // does work at this level)
+ if (siz == SIZB && (am0 == AREG || am1 == AREG))
+ {
+ error("cannot use '.b' with an address register");
+ goto loop;
+ }
+
+ // Keep a backup of chptr (used for optimisations during codegen)
+ chptr_opcode = chptr;
+
+ while (!(m->mnattr & siz) || (amsk0 & m->mn0) == 0 || (amsk1 & m->mn1) == 0)
+ m = &machtab[m->mncont];
+
+ DEBUG { printf(" 68K: mninst=$%X, siz=$%X, mnattr=$%X, amsk0=$%X, mn0=$%X, amsk1=$%X, mn1=$%X\n", m->mninst, siz, m->mnattr, amsk0, m->mn0, amsk1, m->mn1); }
+
+ GENLINENOSYM();
+ (*m->mnfunc)(m->mninst, siz);
+ goto loop;