/*
 * *****************************************************************************
 *
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright (c) 2018-2024 Gavin D. Howard and contributors.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * * Redistributions of source code must retain the above copyright notice, this
 *   list of conditions and the following disclaimer.
 *
 * * Redistributions in binary form must reproduce the above copyright notice,
 *   this list of conditions and the following disclaimer in the documentation
 *   and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 *
 * *****************************************************************************
 *
 * The parser for bc.
 *
 */

#if BC_ENABLED

#include <assert.h>
#include <stdbool.h>
#include <stdlib.h>
#include <string.h>

#include <setjmp.h>

#include <bc.h>
#include <num.h>
#include <vm.h>

// Before you embark on trying to understand this code, have you read the
// Development manual (manuals/development.md) and the comment in include/bc.h
// yet? No? Do that first. I'm serious.
//
// The reason is because this file holds the most sensitive and finicky code in
// the entire codebase. Even getting history to work on Windows was nothing
// compared to this. This is where dreams go to die, where dragons live, and
// from which Ken Thompson himself would flee.

static void
bc_parse_else(BcParse* p);

static void
bc_parse_stmt(BcParse* p);

static BcParseStatus
bc_parse_expr_err(BcParse* p, uint8_t flags, BcParseNext next);

static void
bc_parse_expr_status(BcParse* p, uint8_t flags, BcParseNext next);

/**
 * Returns true if an instruction could only have come from a "leaf" expression.
 * For more on what leaf expressions are, read the comment for BC_PARSE_LEAF().
 * @param t  The instruction to test.
 * @return   True if the instruction is from a leaf expression.
 */
static bool
bc_parse_inst_isLeaf(BcInst t)
{
	// Three cases count as a leaf: the range from BC_INST_NUM through
	// BC_INST_LEADING_ZERO, BC_INST_TRUNC (only with extra math enabled), and
	// everything up to and including BC_INST_DEC.
	// NOTE(review): the last test relies on the ordering of the BcInst enum,
	// which is not visible here; confirm against its definition.
	return (t >= BC_INST_NUM && t <= BC_INST_LEADING_ZERO) ||
#if BC_ENABLE_EXTRA_MATH
	       t == BC_INST_TRUNC ||
#endif // BC_ENABLE_EXTRA_MATH
	       t <= BC_INST_DEC;
}

/**
 * Returns true if the *previous* token was a delimiter. A delimiter is anything
 * that can legally end a statement. In bc's case, it could be a newline, a
 * semicolon, and a brace in certain cases.
 *
 * NOTE(review): the body tests p->l.t and only consults p->l.last for the
 * brace check inside the else case; confirm which token "previous" refers to.
 *
 * @param p  The parser.
 * @return   True if the token is a legal delimiter.
 */
static bool
bc_parse_isDelimiter(const BcParse* p)
{
	BcLexType t = p->l.t;
	bool good;

	// If it's an obvious delimiter, say so.
	if (BC_PARSE_DELIMITER(t)) return true;

	good = false;

	// If the current token is a keyword, then...beware. That means that we need
	// to check for a "dangling" else, where there was no brace-delimited block
	// on the previous if.
	if (t == BC_LEX_KW_ELSE)
	{
		size_t i;
		uint16_t *fptr = NULL, flags = BC_PARSE_FLAG_ELSE;

		// As long as going up the stack is valid for a dangling else, keep on.
		// The walk goes from the top of the flags stack downward and stops at
		// the first entry for which BC_PARSE_BLOCK_STMT() is false.
		for (i = 0; i < p->flags.len && BC_PARSE_BLOCK_STMT(flags); ++i)
		{
			fptr = bc_vec_item_rev(&p->flags, i);
			flags = *fptr;

			// If we need a brace and don't have one, then we don't have a
			// delimiter.
			if ((flags & BC_PARSE_FLAG_BRACE) && p->l.last != BC_LEX_RBRACE)
			{
				return false;
			}
		}

		// Oh, and we had also better have an if statement somewhere. Note that
		// this tests the flags of the *last* entry the loop looked at.
		good = ((flags & BC_PARSE_FLAG_IF) != 0);
	}
	else if (t == BC_LEX_RBRACE)
	{
		size_t i;

		// Since we have a brace, we need to just check if a brace was needed.
		// Any entry on the flags stack with the brace flag is enough.
		for (i = 0; !good && i < p->flags.len; ++i)
		{
			uint16_t* fptr = bc_vec_item_rev(&p->flags, i);
			good = (((*fptr) & BC_PARSE_FLAG_BRACE) != 0);
		}
	}

	return good;
}

/**
 * Returns true if we are in top level of a function body. The POSIX grammar
 * is defined such that anything is allowed after a function body, so we must
 * use this function to detect that case when ending a function body.
 * @param p  The parser.
 * @return   True if we are in the top level of parsing a function body.
 */
static bool
bc_parse_TopFunc(const BcParse* p)
{
	// The top level of a function body means exactly two entries on the flags
	// stack...
	bool good = p->flags.len == 2;

	// ...and a top entry that is exactly brace + function-inner + function.
	uint16_t val = BC_PARSE_FLAG_BRACE | BC_PARSE_FLAG_FUNC_INNER;
	val |= BC_PARSE_FLAG_FUNC;

	return good && BC_PARSE_TOP_FLAG(p) == val;
}

/**
 * Sets a previously defined exit label. What are labels? See the bc Parsing
 * section of the Development manual (manuals/development.md).
165 * @param p The parser. 166 */ 167 static void 168 bc_parse_setLabel(BcParse* p) 169 { 170 BcFunc* func = p->func; 171 BcInstPtr* ip = bc_vec_top(&p->exits); 172 size_t* label; 173 174 assert(func == bc_vec_item(&p->prog->fns, p->fidx)); 175 176 // Set the preallocated label to the correct index. 177 label = bc_vec_item(&func->labels, ip->idx); 178 *label = func->code.len; 179 180 // Now, we don't need the exit label; it is done. 181 bc_vec_pop(&p->exits); 182 } 183 184 /** 185 * Creates a label and sets it to idx. If this is an exit label, then idx is 186 * actually invalid, but it doesn't matter because it will be fixed by 187 * bc_parse_setLabel() later. 188 * @param p The parser. 189 * @param idx The index of the label. 190 */ 191 static void 192 bc_parse_createLabel(BcParse* p, size_t idx) 193 { 194 bc_vec_push(&p->func->labels, &idx); 195 } 196 197 /** 198 * Creates a conditional label. Unlike an exit label, this label is set at 199 * creation time because it comes *before* the code that will target it. 200 * @param p The parser. 201 * @param idx The index of the label. 202 */ 203 static void 204 bc_parse_createCondLabel(BcParse* p, size_t idx) 205 { 206 bc_parse_createLabel(p, p->func->code.len); 207 bc_vec_push(&p->conds, &idx); 208 } 209 210 /** 211 * Creates an exit label to be filled in later by bc_parse_setLabel(). Also, why 212 * create a label to be filled in later? Because exit labels are meant to be 213 * targeted by code that comes *before* the label. Since we have to parse that 214 * code first, and don't know how long it will be, we need to just make sure to 215 * reserve a slot to be filled in later when we know. 216 * 217 * By the way, this uses BcInstPtr because it was convenient. The field idx 218 * holds the index, and the field func holds the loop boolean. 219 * 220 * @param p The parser. 221 * @param idx The index of the label's position. 222 * @param loop True if the exit label is for a loop or not. 
 */
static void
bc_parse_createExitLabel(BcParse* p, size_t idx, bool loop)
{
	BcInstPtr ip;

	assert(p->func == bc_vec_item(&p->prog->fns, p->fidx));

	// BcInstPtr is reused as a plain record here: func carries the loop flag
	// and idx carries the label index.
	ip.func = loop;
	ip.idx = idx;
	ip.len = 0;

	// Remember the exit, then reserve its label slot with a placeholder value.
	bc_vec_push(&p->exits, &ip);
	bc_parse_createLabel(p, SIZE_MAX);
}

/**
 * Pops the correct operators off of the operator stack based on the current
 * operator. This is because of the Shunting-Yard algorithm. Lower prec means
 * higher precedence.
 * @param p       The parser.
 * @param type    The operator.
 * @param start   The previous start of the operator stack. For more
 *                information, see the bc Parsing section of the Development
 *                manual (manuals/development.md).
 * @param nexprs  A pointer to the current number of expressions that have not
 *                been consumed yet. This is an IN and OUT parameter.
 */
static void
bc_parse_operator(BcParse* p, BcLexType type, size_t start, size_t* nexprs)
{
	BcLexType t;
	uchar l, r = BC_PARSE_OP_PREC(type);
	uchar left = BC_PARSE_OP_LEFT(type);

	// While we haven't hit the stop point yet...
	while (p->ops.len > start)
	{
		// Get the top operator.
		t = BC_PARSE_TOP_OP(p);

		// If it's a left paren, we have reached the end of whatever expression
		// this is no matter what. We also don't pop the left paren because it
		// will need to stay for the rest of the subexpression.
		if (t == BC_LEX_LPAREN) break;

		// Break for precedence. Precedence operates differently on left and
		// right associativity, by the way. A left associative operator that
		// matches the current precedence should take priority, but a right
		// associative operator should not.
		//
		// Also, a lower precedence value means a higher precedence.
		l = BC_PARSE_OP_PREC(t);
		if (l >= r && (l != r || !left)) break;

		// Do the housekeeping. In particular, make sure to note that one
		// expression was consumed (well, two were, but another was added) if
		// the operator was not a prefix operator. (Postfix operators are not
		// handled by this function at all.)
		bc_parse_push(p, BC_PARSE_TOKEN_INST(t));
		bc_vec_pop(&p->ops);
		*nexprs -= !BC_PARSE_OP_PREFIX(t);
	}

	// The new operator always ends up on the operator stack.
	bc_vec_push(&p->ops, &type);
}

/**
 * Parses a right paren. In the Shunting-Yard algorithm, a right paren consumes
 * whatever operators there are until it hits a left paren. The left paren is
 * then popped as well; the right paren itself is never pushed onto the operator
 * stack.
 * @param p       The parser.
 * @param nexprs  A pointer to the current number of expressions that have not
 *                been consumed yet. This is an IN and OUT parameter.
 */
static void
bc_parse_rightParen(BcParse* p, size_t* nexprs)
{
	BcLexType top;

	// Consume operators until a left paren.
	while ((top = BC_PARSE_TOP_OP(p)) != BC_LEX_LPAREN)
	{
		bc_parse_push(p, BC_PARSE_TOKEN_INST(top));
		bc_vec_pop(&p->ops);
		*nexprs -= !BC_PARSE_OP_PREFIX(top);
	}

	// We need to pop the left paren as well.
	bc_vec_pop(&p->ops);

	// Oh, and we also want the next token.
	bc_lex_next(&p->l);
}

/**
 * Parses function arguments and pushes the call instruction followed by the
 * number of arguments.
 * @param p      The parser.
 * @param flags  Flags restricting what kind of expressions the arguments can
 *               be.
 */
static void
bc_parse_args(BcParse* p, uint8_t flags)
{
	bool comma = false;
	size_t nargs;

	bc_lex_next(&p->l);

	// Print and comparison operators not allowed. Well, comparison operators
	// only for POSIX. But we do allow arrays, and we *must* get a value.
	flags &= ~(BC_PARSE_PRINT | BC_PARSE_REL);
	flags |= (BC_PARSE_ARRAY | BC_PARSE_NEEDVAL);

	// Count the arguments and parse them.
	for (nargs = 0; p->l.t != BC_LEX_RPAREN; ++nargs)
	{
		bc_parse_expr_status(p, flags, bc_parse_next_arg);

		// Remember whether the argument was followed by a comma so that a
		// trailing comma can be detected after the loop.
		comma = (p->l.t == BC_LEX_COMMA);
		if (comma) bc_lex_next(&p->l);
	}

	// An ending comma is FAIL.
	if (BC_ERR(comma)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	// Now do the call with the number of arguments.
	bc_parse_push(p, BC_INST_CALL);
	bc_parse_pushIndex(p, nargs);
}

/**
 * Parses a function call.
 * @param p      The parser.
 * @param name   The name of the function being called. It is looked up in the
 *               program's function map and inserted if it is not there yet.
 * @param flags  Flags restricting what kind of expressions the arguments can
 *               be.
 */
static void
bc_parse_call(BcParse* p, const char* name, uint8_t flags)
{
	size_t idx;

	bc_parse_args(p, flags);

	// We just assert this because bc_parse_args() should
	// ensure that the next token is what it should be.
	assert(p->l.t == BC_LEX_RPAREN);

	// We cannot use bc_program_insertFunc() here
	// because it will overwrite an existing function.
	idx = bc_map_index(&p->prog->fn_map, name);

	// The function does not exist yet. Create a space for it. If the user does
	// not define it, it's a *runtime* error, not a parse error.
	if (idx == BC_VEC_INVALID_IDX)
	{
		idx = bc_program_insertFunc(p->prog, name);

		assert(idx != BC_VEC_INVALID_IDX);

		// Make sure that this pointer was not invalidated.
		p->func = bc_vec_item(&p->prog->fns, p->fidx);
	}
	// The function exists, so set the right function index.
	else idx = ((BcId*) bc_vec_item(&p->prog->fn_map, idx))->idx;

	// The function index follows the call instruction and argument count that
	// bc_parse_args() pushed.
	bc_parse_pushIndex(p, idx);

	// Make sure to get the next token.
	bc_lex_next(&p->l);
}

/**
 * Parses a name/identifier-based expression. It could be a variable, an array
 * element, an array itself (for function arguments), a function call, etc.
 * @param p           The parser.
 * @param type        A pointer to return the resulting instruction.
400 * @param can_assign A pointer to return true if the name can be assigned to, 401 * false otherwise. 402 * @param flags Flags restricting what kind of expression the name can be. 403 */ 404 static void 405 bc_parse_name(BcParse* p, BcInst* type, bool* can_assign, uint8_t flags) 406 { 407 char* name; 408 409 BC_SIG_ASSERT_LOCKED; 410 411 // We want a copy of the name since the lexer might overwrite its copy. 412 name = bc_vm_strdup(p->l.str.v); 413 414 BC_SETJMP_LOCKED(vm, err); 415 416 // We need the next token to see if it's just a variable or something more. 417 bc_lex_next(&p->l); 418 419 // Array element or array. 420 if (p->l.t == BC_LEX_LBRACKET) 421 { 422 bc_lex_next(&p->l); 423 424 // Array only. This has to be a function parameter. 425 if (p->l.t == BC_LEX_RBRACKET) 426 { 427 // Error if arrays are not allowed. 428 if (BC_ERR(!(flags & BC_PARSE_ARRAY))) 429 { 430 bc_parse_err(p, BC_ERR_PARSE_EXPR); 431 } 432 433 *type = BC_INST_ARRAY; 434 *can_assign = false; 435 } 436 else 437 { 438 // If we are here, we have an array element. We need to set the 439 // expression parsing flags. 440 uint8_t flags2 = (flags & ~(BC_PARSE_PRINT | BC_PARSE_REL)) | 441 BC_PARSE_NEEDVAL; 442 443 bc_parse_expr_status(p, flags2, bc_parse_next_elem); 444 445 // The next token *must* be a right bracket. 446 if (BC_ERR(p->l.t != BC_LEX_RBRACKET)) 447 { 448 bc_parse_err(p, BC_ERR_PARSE_TOKEN); 449 } 450 451 *type = BC_INST_ARRAY_ELEM; 452 *can_assign = true; 453 } 454 455 // Make sure to get the next token. 456 bc_lex_next(&p->l); 457 458 // Push the instruction and the name of the identifier. 459 bc_parse_push(p, *type); 460 bc_parse_pushName(p, name, false); 461 } 462 else if (p->l.t == BC_LEX_LPAREN) 463 { 464 // We are parsing a function call; error if not allowed. 
465 if (BC_ERR(flags & BC_PARSE_NOCALL)) 466 { 467 bc_parse_err(p, BC_ERR_PARSE_TOKEN); 468 } 469 470 *type = BC_INST_CALL; 471 *can_assign = false; 472 473 bc_parse_call(p, name, flags); 474 } 475 else 476 { 477 // Just a variable. 478 *type = BC_INST_VAR; 479 *can_assign = true; 480 bc_parse_push(p, BC_INST_VAR); 481 bc_parse_pushName(p, name, true); 482 } 483 484 err: 485 // Need to make sure to unallocate the name. 486 free(name); 487 BC_LONGJMP_CONT(vm); 488 BC_SIG_MAYLOCK; 489 } 490 491 /** 492 * Parses a builtin function that takes no arguments. This includes read(), 493 * rand(), maxibase(), maxobase(), maxscale(), and maxrand(). 494 * @param p The parser. 495 * @param inst The instruction corresponding to the builtin. 496 */ 497 static void 498 bc_parse_noArgBuiltin(BcParse* p, BcInst inst) 499 { 500 // Must have a left paren. 501 bc_lex_next(&p->l); 502 if (BC_ERR(p->l.t != BC_LEX_LPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 503 504 // Must have a right paren. 505 bc_lex_next(&p->l); 506 if ((p->l.t != BC_LEX_RPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 507 508 bc_parse_push(p, inst); 509 510 bc_lex_next(&p->l); 511 } 512 513 /** 514 * Parses a builtin function that takes 1 argument. This includes length(), 515 * sqrt(), abs(), scale(), and irand(). 516 * @param p The parser. 517 * @param type The lex token. 518 * @param flags The expression parsing flags for parsing the argument. 519 * @param prev An out parameter; the previous instruction pointer. 520 */ 521 static void 522 bc_parse_builtin(BcParse* p, BcLexType type, uint8_t flags, BcInst* prev) 523 { 524 // Must have a left paren. 525 bc_lex_next(&p->l); 526 if (BC_ERR(p->l.t != BC_LEX_LPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 527 528 bc_lex_next(&p->l); 529 530 // Change the flags as needed for parsing the argument. 531 flags &= ~(BC_PARSE_PRINT | BC_PARSE_REL); 532 flags |= BC_PARSE_NEEDVAL; 533 534 // Since length can take arrays, we need to specially add that flag. 
535 if (type == BC_LEX_KW_LENGTH || type == BC_LEX_KW_ASCIIFY) 536 { 537 flags |= BC_PARSE_ARRAY; 538 } 539 540 // Otherwise, we need to clear it because it could be set. 541 else flags &= ~(BC_PARSE_ARRAY); 542 543 bc_parse_expr_status(p, flags, bc_parse_next_rel); 544 545 // Must have a right paren. 546 if (BC_ERR(p->l.t != BC_LEX_RPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 547 548 // Adjust previous based on the token and push it. 549 *prev = type - BC_LEX_KW_LENGTH + BC_INST_LENGTH; 550 bc_parse_push(p, *prev); 551 552 bc_lex_next(&p->l); 553 } 554 555 /** 556 * Parses a builtin function that takes 3 arguments. This includes modexp() and 557 * divmod(). 558 * @param p The parser. 559 * @param type The lex token. 560 * @param flags The expression parsing flags for parsing the argument. 561 * @param prev An out parameter; the previous instruction pointer. 562 */ 563 static void 564 bc_parse_builtin3(BcParse* p, BcLexType type, uint8_t flags, BcInst* prev) 565 { 566 assert(type == BC_LEX_KW_MODEXP || type == BC_LEX_KW_DIVMOD); 567 568 // Must have a left paren. 569 bc_lex_next(&p->l); 570 if (BC_ERR(p->l.t != BC_LEX_LPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 571 572 bc_lex_next(&p->l); 573 574 // Change the flags as needed for parsing the argument. 575 flags &= ~(BC_PARSE_PRINT | BC_PARSE_REL); 576 flags |= BC_PARSE_NEEDVAL; 577 578 bc_parse_expr_status(p, flags, bc_parse_next_builtin); 579 580 // Must have a comma. 581 if (BC_ERR(p->l.t != BC_LEX_COMMA)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 582 583 bc_lex_next(&p->l); 584 585 bc_parse_expr_status(p, flags, bc_parse_next_builtin); 586 587 // Must have a comma. 588 if (BC_ERR(p->l.t != BC_LEX_COMMA)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 589 590 bc_lex_next(&p->l); 591 592 // If it is a divmod, parse an array name. Otherwise, just parse another 593 // expression. 594 if (type == BC_LEX_KW_DIVMOD) 595 { 596 // Must have a name. 
597 if (BC_ERR(p->l.t != BC_LEX_NAME)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 598 599 // This is safe because the next token should not overwrite the name. 600 bc_lex_next(&p->l); 601 602 // Must have a left bracket. 603 if (BC_ERR(p->l.t != BC_LEX_LBRACKET)) 604 { 605 bc_parse_err(p, BC_ERR_PARSE_TOKEN); 606 } 607 608 // This is safe because the next token should not overwrite the name. 609 bc_lex_next(&p->l); 610 611 // Must have a right bracket. 612 if (BC_ERR(p->l.t != BC_LEX_RBRACKET)) 613 { 614 bc_parse_err(p, BC_ERR_PARSE_TOKEN); 615 } 616 617 // This is safe because the next token should not overwrite the name. 618 bc_lex_next(&p->l); 619 } 620 else bc_parse_expr_status(p, flags, bc_parse_next_rel); 621 622 // Must have a right paren. 623 if (BC_ERR(p->l.t != BC_LEX_RPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 624 625 // Adjust previous based on the token and push it. 626 *prev = type - BC_LEX_KW_MODEXP + BC_INST_MODEXP; 627 bc_parse_push(p, *prev); 628 629 // If we have divmod, we need to assign the modulus to the array element, so 630 // we need to push the instructions for doing so. 631 if (type == BC_LEX_KW_DIVMOD) 632 { 633 // The zeroth element. 634 bc_parse_push(p, BC_INST_ZERO); 635 bc_parse_push(p, BC_INST_ARRAY_ELEM); 636 637 // Push the array. 638 bc_parse_pushName(p, p->l.str.v, false); 639 640 // Swap them and assign. After this, the top item on the stack should 641 // be the quotient. 642 bc_parse_push(p, BC_INST_SWAP); 643 bc_parse_push(p, BC_INST_ASSIGN_NO_VAL); 644 } 645 646 bc_lex_next(&p->l); 647 } 648 649 /** 650 * Parses the scale keyword. This is special because scale can be a value or a 651 * builtin function. 652 * @param p The parser. 653 * @param type An out parameter; the instruction for the parse. 654 * @param can_assign An out parameter; whether the expression can be assigned 655 * to. 656 * @param flags The expression parsing flags for parsing a scale() arg. 
657 */ 658 static void 659 bc_parse_scale(BcParse* p, BcInst* type, bool* can_assign, uint8_t flags) 660 { 661 bc_lex_next(&p->l); 662 663 // Without the left paren, it's just the keyword. 664 if (p->l.t != BC_LEX_LPAREN) 665 { 666 // Set, push, and return. 667 *type = BC_INST_SCALE; 668 *can_assign = true; 669 bc_parse_push(p, BC_INST_SCALE); 670 return; 671 } 672 673 // Handle the scale function. 674 *type = BC_INST_SCALE_FUNC; 675 *can_assign = false; 676 677 // Once again, adjust the flags. 678 flags &= ~(BC_PARSE_PRINT | BC_PARSE_REL); 679 flags |= BC_PARSE_NEEDVAL; 680 681 bc_lex_next(&p->l); 682 683 bc_parse_expr_status(p, flags, bc_parse_next_rel); 684 685 // Must have a right paren. 686 if (BC_ERR(p->l.t != BC_LEX_RPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN); 687 688 bc_parse_push(p, BC_INST_SCALE_FUNC); 689 690 bc_lex_next(&p->l); 691 } 692 693 /** 694 * Parses and increment or decrement operator. This is a bit complex. 695 * @param p The parser. 696 * @param prev An out parameter; the previous instruction pointer. 697 * @param can_assign An out parameter; whether the expression can be assigned 698 * to. 699 * @param nexs An in/out parameter; the number of expressions in the 700 * parse tree that are not used. 701 * @param flags The expression parsing flags for parsing a scale() arg. 702 */ 703 static void 704 bc_parse_incdec(BcParse* p, BcInst* prev, bool* can_assign, size_t* nexs, 705 uint8_t flags) 706 { 707 BcLexType type; 708 uchar inst; 709 BcInst etype = *prev; 710 BcLexType last = p->l.last; 711 712 assert(prev != NULL && can_assign != NULL); 713 714 // If we can't assign to the previous token, then we have an error. 715 if (BC_ERR(last == BC_LEX_OP_INC || last == BC_LEX_OP_DEC || 716 last == BC_LEX_RPAREN)) 717 { 718 bc_parse_err(p, BC_ERR_PARSE_ASSIGN); 719 } 720 721 // Is the previous instruction for a variable? 722 if (BC_PARSE_INST_VAR(etype)) 723 { 724 // If so, this is a postfix operator. 
725 if (!*can_assign) bc_parse_err(p, BC_ERR_PARSE_ASSIGN); 726 727 // Only postfix uses BC_INST_INC and BC_INST_DEC. 728 *prev = inst = BC_INST_INC + (p->l.t != BC_LEX_OP_INC); 729 bc_parse_push(p, inst); 730 bc_lex_next(&p->l); 731 *can_assign = false; 732 } 733 else 734 { 735 // This is a prefix operator. In that case, we just convert it to 736 // an assignment instruction. 737 *prev = inst = BC_INST_ASSIGN_PLUS + (p->l.t != BC_LEX_OP_INC); 738 739 bc_lex_next(&p->l); 740 type = p->l.t; 741 742 // Because we parse the next part of the expression 743 // right here, we need to increment this. 744 *nexs = *nexs + 1; 745 746 // Is the next token a normal identifier? 747 if (type == BC_LEX_NAME) 748 { 749 // Parse the name. 750 uint8_t flags2 = flags & ~(BC_PARSE_ARRAY); 751 bc_parse_name(p, prev, can_assign, flags2 | BC_PARSE_NOCALL); 752 } 753 // Is the next token a global? 754 else if (type >= BC_LEX_KW_LAST && type <= BC_LEX_KW_OBASE) 755 { 756 bc_parse_push(p, type - BC_LEX_KW_LAST + BC_INST_LAST); 757 bc_lex_next(&p->l); 758 } 759 // Is the next token specifically scale, which needs special treatment? 760 else if (BC_NO_ERR(type == BC_LEX_KW_SCALE)) 761 { 762 bc_lex_next(&p->l); 763 764 // Check that scale() was not used. 765 if (BC_ERR(p->l.t == BC_LEX_LPAREN)) 766 { 767 bc_parse_err(p, BC_ERR_PARSE_TOKEN); 768 } 769 else bc_parse_push(p, BC_INST_SCALE); 770 } 771 // Now we know we have an error. 772 else bc_parse_err(p, BC_ERR_PARSE_TOKEN); 773 774 *can_assign = false; 775 776 bc_parse_push(p, BC_INST_ONE); 777 bc_parse_push(p, inst); 778 } 779 } 780 781 /** 782 * Parses the minus operator. This needs special treatment because it is either 783 * subtract or negation. 784 * @param p The parser. 785 * @param prev An in/out parameter; the previous instruction. 786 * @param ops_bgn The size of the operator stack. 787 * @param rparen True if the last token was a right paren. 788 * @param binlast True if the last token was a binary operator. 
 * @param nexprs   An in/out parameter; the number of unused expressions.
 */
static void
bc_parse_minus(BcParse* p, BcInst* prev, size_t ops_bgn, bool rparen,
               bool binlast, size_t* nexprs)
{
	BcLexType type;

	bc_lex_next(&p->l);

	// Figure out if it's a minus or a negation.
	type = BC_PARSE_LEAF(*prev, binlast, rparen) ? BC_LEX_OP_MINUS : BC_LEX_NEG;
	*prev = BC_PARSE_TOKEN_INST(type);

	// We can just push onto the op stack because this is the largest
	// precedence operator that gets pushed. Inc/dec does not.
	if (type != BC_LEX_OP_MINUS) bc_vec_push(&p->ops, &type);
	else bc_parse_operator(p, type, ops_bgn, nexprs);
}

/**
 * Parses a string.
 * @param p     The parser.
 * @param inst  The instruction corresponding to how the string was found and
 *              how it should be printed.
 */
static void
bc_parse_str(BcParse* p, BcInst inst)
{
	bc_parse_addString(p);
	bc_parse_push(p, inst);
	bc_lex_next(&p->l);
}

/**
 * Parses a print statement.
 * @param p     The parser.
 * @param type  The lex token of the statement. BC_LEX_KW_STREAM selects
 *              BC_INST_PRINT_STREAM; anything else selects BC_INST_PRINT_POP.
 */
static void
bc_parse_print(BcParse* p, BcLexType type)
{
	BcLexType t;
	bool comma = false;
	BcInst inst = type == BC_LEX_KW_STREAM ? BC_INST_PRINT_STREAM :
	                                         BC_INST_PRINT_POP;

	bc_lex_next(&p->l);

	t = p->l.t;

	// A print or stream statement has to have *something*.
	if (bc_parse_isDelimiter(p)) bc_parse_err(p, BC_ERR_PARSE_PRINT);

	do
	{
		// If the token is a string, then print it with escapes.
		// BC_INST_PRINT_POP plays that role for bc.
		if (t == BC_LEX_STR) bc_parse_str(p, inst);
		else
		{
			// We have an actual number; parse and add a print instruction.
			bc_parse_expr_status(p, BC_PARSE_NEEDVAL, bc_parse_next_print);
			bc_parse_push(p, inst);
		}

		// Is the next token a comma?
		comma = (p->l.t == BC_LEX_COMMA);

		// Get the next token if we have a comma.
		if (comma) bc_lex_next(&p->l);
		else
		{
			// If we don't have a comma, the statement needs to end.
			if (!bc_parse_isDelimiter(p)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
			else break;
		}

		t = p->l.t;
	}
	while (true);

	// If we have a comma but no token, that's bad.
	if (BC_ERR(comma)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
}

/**
 * Parses a return statement.
 * @param p  The parser.
 */
static void
bc_parse_return(BcParse* p)
{
	BcLexType t;
	bool paren;
	uchar inst = BC_INST_RET0;

	// If we are not in a function, that's an error.
	if (BC_ERR(!BC_PARSE_FUNC(p))) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	// If we are in a void function, make sure to return void.
	if (p->func->voidfn) inst = BC_INST_RET_VOID;

	bc_lex_next(&p->l);

	// Remember whether the expression starts with a left paren; this is
	// needed for the POSIX check below.
	t = p->l.t;
	paren = (t == BC_LEX_LPAREN);

	// An empty return statement just needs to push the selected instruction.
	if (bc_parse_isDelimiter(p)) bc_parse_push(p, inst);
	else
	{
		BcParseStatus s;

		// Need to parse the expression whose value will be returned.
		s = bc_parse_expr_err(p, BC_PARSE_NEEDVAL, bc_parse_next_expr);

		// If the expression was empty, just push the selected instruction.
		if (s == BC_PARSE_STATUS_EMPTY_EXPR)
		{
			bc_parse_push(p, inst);
			bc_lex_next(&p->l);
		}

		// POSIX requires parentheses.
		if (!paren || p->l.last != BC_LEX_RPAREN)
		{
			bc_parse_err(p, BC_ERR_POSIX_RET);
		}

		// Void functions require an empty expression.
		if (BC_ERR(p->func->voidfn))
		{
			if (s != BC_PARSE_STATUS_EMPTY_EXPR)
			{
				bc_parse_verr(p, BC_ERR_PARSE_RET_VOID, p->func->name);
			}
		}
		// If we got here, we want to be sure to end the function with a real
		// return instruction, just in case.
		else bc_parse_push(p, BC_INST_RET);
	}
}

/**
 * Clears flags that indicate the end of an if statement and its block and sets
 * the jump location.
 * @param p  The parser.
 */
static void
bc_parse_noElse(BcParse* p)
{
	uint16_t* flag_ptr = BC_PARSE_TOP_FLAG_PTR(p);
	*flag_ptr = (*flag_ptr & ~(BC_PARSE_FLAG_IF_END));
	bc_parse_setLabel(p);
}

/**
 * Ends (finishes parsing) the body of a control statement or a function.
 * @param p      The parser.
 * @param brace  True if the body was ended by a brace, false otherwise.
 */
static void
bc_parse_endBody(BcParse* p, bool brace)
{
	bool has_brace, new_else = false;

	// We cannot be ending a body if there are no bodies to end.
	if (BC_ERR(p->flags.len <= 1)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	if (brace)
	{
		// The brace was already gotten; make sure that the caller did not lie.
		// We check for the requirement of braces later.
		assert(p->l.t == BC_LEX_RBRACE);

		bc_lex_next(&p->l);

		// If the next token is not a delimiter, that is a problem.
		if (BC_ERR(!bc_parse_isDelimiter(p) && !bc_parse_TopFunc(p)))
		{
			bc_parse_err(p, BC_ERR_PARSE_TOKEN);
		}
	}

	// Do we have a brace flag?
	has_brace = (BC_PARSE_BRACE(p) != 0);

	// Each iteration closes one entry of the flags stack.
	do
	{
		// The length is saved so that the if handling below can tell whether
		// an entry was already popped in this iteration.
		size_t len = p->flags.len;
		bool loop;

		// If we have a brace flag but not a brace, that's a problem.
		if (has_brace && !brace) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

		// Are we inside a loop?
		loop = (BC_PARSE_LOOP_INNER(p) != 0);

		// If we are ending a loop or an else...
		if (loop || BC_PARSE_ELSE(p))
		{
			// Loops have condition labels that we have to take care of as well.
			if (loop)
			{
				size_t* label = bc_vec_top(&p->conds);

				// Jump back to the loop's condition.
				bc_parse_push(p, BC_INST_JUMP);
				bc_parse_pushIndex(p, *label);

				bc_vec_pop(&p->conds);
			}

			bc_parse_setLabel(p);
			bc_vec_pop(&p->flags);
		}
		// If we are ending a function...
		else if (BC_PARSE_FUNC_INNER(p))
		{
			BcInst inst = (p->func->voidfn ? BC_INST_RET_VOID : BC_INST_RET0);
			bc_parse_push(p, inst);
			bc_parse_updateFunc(p, BC_PROG_MAIN);
			bc_vec_pop(&p->flags);
		}
		// If we have a brace flag and not an if statement, we can pop the top
		// of the flags stack because they have been taken care of above.
		else if (has_brace && !BC_PARSE_IF(p)) bc_vec_pop(&p->flags);

		// This needs to be last to parse nested if's properly.
		if (BC_PARSE_IF(p) && (len == p->flags.len || !BC_PARSE_BRACE(p)))
		{
			// Eat newlines.
			while (p->l.t == BC_LEX_NLINE)
			{
				bc_lex_next(&p->l);
			}

			// *Now* we can pop the flags.
			bc_vec_pop(&p->flags);

			// If we are allowed non-POSIX stuff...
			if (!BC_S)
			{
				// Have we found yet another dangling else?
				*(BC_PARSE_TOP_FLAG_PTR(p)) |= BC_PARSE_FLAG_IF_END;
				new_else = (p->l.t == BC_LEX_KW_ELSE);

				// Parse the else or end the if statement body.
				if (new_else) bc_parse_else(p);
				else if (!has_brace && (!BC_PARSE_IF_END(p) || brace))
				{
					bc_parse_noElse(p);
				}
			}
			// POSIX requires us to do the bare minimum only.
			else bc_parse_noElse(p);
		}

		// If these are both true, we have "used" the braces that we found.
		if (brace && has_brace) brace = false;
	}
	// This condition was perhaps the hardest single part of the parser. If
	// the flags stack does not have enough, we should stop. If we have a
	// new else statement, we should stop. If we do have the end of an if
	// statement and we have eaten the brace, we should stop. If we do have
	// a brace flag, we should stop.
	//
	// Note that the last clause also *assigns* has_brace for the next
	// iteration; it is only evaluated when the earlier clauses are all true.
	while (p->flags.len > 1 && !new_else && (!BC_PARSE_IF_END(p) || brace) &&
	       !(has_brace = (BC_PARSE_BRACE(p) != 0)));

	// If we have a brace, yet no body for it, that's a problem.
	if (BC_ERR(p->flags.len == 1 && brace)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
	else if (brace && BC_PARSE_BRACE(p))
	{
		// If we make it here, we have a brace and a flag for it.
		uint16_t flags = BC_PARSE_TOP_FLAG(p);

		// This condition ensures that the *last* body is correctly finished by
		// popping its flags.
		if (!(flags & (BC_PARSE_FLAG_FUNC_INNER | BC_PARSE_FLAG_LOOP_INNER)) &&
		    !(flags & (BC_PARSE_FLAG_IF | BC_PARSE_FLAG_ELSE)) &&
		    !(flags & (BC_PARSE_FLAG_IF_END)))
		{
			bc_vec_pop(&p->flags);
		}
	}
}

/**
 * Starts the body of a control statement or function.
 * @param p      The parser.
 * @param flags  The current flags (will be edited).
 */
static void
bc_parse_startBody(BcParse* p, uint16_t flags)
{
	assert(flags);
	// The new body inherits the function and loop flags of the enclosing
	// entry and is marked as a body before being pushed.
	flags |= (BC_PARSE_TOP_FLAG(p) & (BC_PARSE_FLAG_FUNC | BC_PARSE_FLAG_LOOP));
	flags |= BC_PARSE_FLAG_BODY;
	bc_vec_push(&p->flags, &flags);
}

void
bc_parse_endif(BcParse* p)
{
	size_t i;
	bool good;

	// Not a problem if this is true.
	if (BC_NO_ERR(!BC_PARSE_NO_EXEC(p))) return;

	good = true;

	// Find an instance of a body that needs closing, i.e., a statement that did
	// not have a right brace when it should have.
	for (i = 0; good && i < p->flags.len; ++i)
	{
		uint16_t flag = *((uint16_t*) bc_vec_item(&p->flags, i));
		good = ((flag & BC_PARSE_FLAG_BRACE) != BC_PARSE_FLAG_BRACE);
	}

	// If we did not find such an instance...
	if (good)
	{
		// We set this to restore it later. We don't want the parser thinking
		// that we are on stdin for this one because it will want more.
BcMode mode = vm->mode;

		vm->mode = BC_MODE_FILE;

		// End all of the if statements and loops. Each pass clears a pending
		// "else may follow" marker and/or ends one more body, until only the
		// bottom entry of the flag stack is left with no marker on it.
		while (p->flags.len > 1 || BC_PARSE_IF_END(p))
		{
			if (BC_PARSE_IF_END(p)) bc_parse_noElse(p);
			if (p->flags.len > 1) bc_parse_endBody(p, false);
		}

		vm->mode = (uchar) mode;
	}
	// If we reach here, a block was not properly closed, and we should error.
	// NOTE(review): this reports through &vm->prs rather than p; presumably
	// they are the same parser -- confirm.
	else bc_parse_err(&vm->prs, BC_ERR_PARSE_BLOCK);
}

/**
 * Parses an if statement header, i.e., the keyword and the parenthesized
 * condition, emits the conditional jump over the body, and starts the body.
 * @param p  The parser.
 */
static void
bc_parse_if(BcParse* p)
{
	// We are allowed relational operators, and we must have a value.
	size_t idx;
	uint8_t flags = (BC_PARSE_REL | BC_PARSE_NEEDVAL);

	// Get the left paren and barf if necessary.
	bc_lex_next(&p->l);
	if (BC_ERR(p->l.t != BC_LEX_LPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	// Parse the condition.
	bc_lex_next(&p->l);
	bc_parse_expr_status(p, flags, bc_parse_next_rel);

	// Must have a right paren.
	if (BC_ERR(p->l.t != BC_LEX_RPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	bc_lex_next(&p->l);

	// Insert the conditional jump instruction.
	bc_parse_push(p, BC_INST_JUMP_ZERO);

	// The jump target is the label that is about to be created, so its index
	// is the current number of labels.
	idx = p->func->labels.len;

	// Push the index for the instruction and create an exit label for an else
	// statement.
	bc_parse_pushIndex(p, idx);
	bc_parse_createExitLabel(p, idx, false);

	bc_parse_startBody(p, BC_PARSE_FLAG_IF);
}

/**
 * Parses an else statement. This emits the jump that skips the else body,
 * resolves the pending label of the if, and starts the else body.
 * @param p  The parser.
 */
static void
bc_parse_else(BcParse* p)
{
	// As in bc_parse_if(), the label that will be created below gets the
	// current number of labels as its index.
	size_t idx = p->func->labels.len;

	// We must be at the end of an if statement.
	if (BC_ERR(!BC_PARSE_IF_END(p))) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	// Push an unconditional jump to make bc jump over the else statement if it
	// executed the original if statement.
	bc_parse_push(p, BC_INST_JUMP);
	bc_parse_pushIndex(p, idx);

	// Clear the else stuff. Yes, that function is misnamed for its use here,
	// but deal with it.
	bc_parse_noElse(p);

	// Create the exit label and parse the body.
	bc_parse_createExitLabel(p, idx, false);
	bc_parse_startBody(p, BC_PARSE_FLAG_ELSE);

	// Only now is the else keyword itself consumed.
	bc_lex_next(&p->l);
}

/**
 * Parses a while loop header, i.e., the keyword and the parenthesized
 * condition, emits the conditional jump to the exit, and starts the body.
 * @param p  The parser.
 */
static void
bc_parse_while(BcParse* p)
{
	// We are allowed relational operators, and we must have a value.
	size_t idx;
	uint8_t flags = (BC_PARSE_REL | BC_PARSE_NEEDVAL);

	// Get the left paren and barf if necessary.
	bc_lex_next(&p->l);
	if (BC_ERR(p->l.t != BC_LEX_LPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
	bc_lex_next(&p->l);

	// Create the labels. Loops need both. The condition label has to exist
	// before the condition is parsed because the end of the body jumps back
	// to it.
	bc_parse_createCondLabel(p, p->func->labels.len);
	idx = p->func->labels.len;
	bc_parse_createExitLabel(p, idx, true);

	// Parse the actual condition and barf on non-right paren.
	bc_parse_expr_status(p, flags, bc_parse_next_rel);
	if (BC_ERR(p->l.t != BC_LEX_RPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
	bc_lex_next(&p->l);

	// Now we can push the conditional jump and start the body.
	bc_parse_push(p, BC_INST_JUMP_ZERO);
	bc_parse_pushIndex(p, idx);
	bc_parse_startBody(p, BC_PARSE_FLAG_LOOP | BC_PARSE_FLAG_LOOP_INNER);
}

/**
 * Parses a for loop header, i.e., the keyword and the three parenthesized
 * clauses (each of which may be empty), emits the jumps that tie condition,
 * update code, and body together, and starts the body.
 * @param p  The parser.
 */
static void
bc_parse_for(BcParse* p)
{
	size_t cond_idx, exit_idx, body_idx, update_idx;

	// Barf on the missing left paren.
	bc_lex_next(&p->l);
	if (BC_ERR(p->l.t != BC_LEX_LPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
	bc_lex_next(&p->l);

	// The first statement can be empty, but if it is, check for error in POSIX
	// mode. Otherwise, parse it.
if (p->l.t != BC_LEX_SCOLON) bc_parse_expr_status(p, 0, bc_parse_next_for);
	else bc_parse_err(p, BC_ERR_POSIX_FOR);

	// Must have a semicolon.
	if (BC_ERR(p->l.t != BC_LEX_SCOLON)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
	bc_lex_next(&p->l);

	// These are indices for labels. There are so many of them because the end
	// of the loop must unconditionally jump to the update code. Then the update
	// code must unconditionally jump to the condition code. Then the condition
	// code must *conditionally* jump to the exit.
	//
	// NOTE(review): the four indices are consecutive, starting at the current
	// number of labels. This presumably relies on each of the four create
	// calls below adding exactly one label, in this order -- confirm.
	cond_idx = p->func->labels.len;
	update_idx = cond_idx + 1;
	body_idx = update_idx + 1;
	exit_idx = body_idx + 1;

	// This creates the condition label.
	bc_parse_createLabel(p, p->func->code.len);

	// Parse an expression if it exists.
	if (p->l.t != BC_LEX_SCOLON)
	{
		uint8_t flags = (BC_PARSE_REL | BC_PARSE_NEEDVAL);
		bc_parse_expr_status(p, flags, bc_parse_next_for);
	}
	else
	{
		// Set this for the next call to bc_parse_number because an empty
		// condition means that it is an infinite loop, so the condition must be
		// non-zero. This is safe to set because the current token is a
		// semicolon, which has no string requirement.
		bc_vec_string(&p->l.str, sizeof(bc_parse_one) - 1, bc_parse_one);
		bc_parse_number(p);

		// An empty condition makes POSIX mad.
		bc_parse_err(p, BC_ERR_POSIX_FOR);
	}

	// Must have a semicolon.
	if (BC_ERR(p->l.t != BC_LEX_SCOLON)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
	bc_lex_next(&p->l);

	// Now we can set up the conditional jump to the exit and an unconditional
	// jump to the body right after. The unconditional jump to the body is
	// because there is update code coming right after the condition, so we need
	// to skip it to get to the body.
	bc_parse_push(p, BC_INST_JUMP_ZERO);
	bc_parse_pushIndex(p, exit_idx);
	bc_parse_push(p, BC_INST_JUMP);
	bc_parse_pushIndex(p, body_idx);

	// Now create the label for the update code.
	bc_parse_createCondLabel(p, update_idx);

	// Parse if not empty, and if it is, let POSIX yell if necessary.
	if (p->l.t != BC_LEX_RPAREN) bc_parse_expr_status(p, 0, bc_parse_next_rel);
	else bc_parse_err(p, BC_ERR_POSIX_FOR);

	// Must have a right paren.
	if (BC_ERR(p->l.t != BC_LEX_RPAREN)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	// Set up a jump to the condition right after the update code. The label
	// created right after the jump marks where the body begins.
	bc_parse_push(p, BC_INST_JUMP);
	bc_parse_pushIndex(p, cond_idx);
	bc_parse_createLabel(p, p->func->code.len);

	// Create an exit label for the body and start the body.
	bc_parse_createExitLabel(p, exit_idx, true);
	bc_lex_next(&p->l);
	bc_parse_startBody(p, BC_PARSE_FLAG_LOOP | BC_PARSE_FLAG_LOOP_INNER);
}

/**
 * Parse a statement or token that indicates a loop exit. This includes an
 * actual loop exit, the break keyword, or the continue keyword. In every case
 * the result is one unconditional jump; only the target differs.
 * @param p     The parser.
 * @param type  The type of exit.
 */
static void
bc_parse_loopExit(BcParse* p, BcLexType type)
{
	size_t i;
	BcInstPtr* ip;

	// Must have a loop. If we don't, that's an error.
	if (BC_ERR(!BC_PARSE_LOOP(p))) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

	// If we have a break statement...
	if (type == BC_LEX_KW_BREAK)
	{
		// If there are no exits, something went wrong somewhere.
		if (BC_ERR(!p->exits.len)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

		// Get the exit.
		i = p->exits.len - 1;
		ip = bc_vec_item(&p->exits, i);

		// The condition !ip->func is true if the exit is not for a loop, so we
		// need to find the first actual loop exit.
while (!ip->func && i < p->exits.len)
		{
			// The first pass re-reads the item that was already fetched
			// above; after that, this walks down the exits one at a time.
			// Since i is unsigned, decrementing it past zero wraps around to
			// a value that fails the bounds test above and ends the scan.
			ip = bc_vec_item(&p->exits, i);
			i -= 1;
		}

		// Make sure everything is hunky dory.
		assert(ip != NULL && (i < p->exits.len || ip->func));

		// Set the index for the exit.
		i = ip->idx;
	}
	// If we have a continue statement or just the loop end, jump to the
	// condition (or update for a for loop).
	else i = *((size_t*) bc_vec_top(&p->conds));

	// Add the unconditional jump.
	bc_parse_push(p, BC_INST_JUMP);
	bc_parse_pushIndex(p, i);

	bc_lex_next(&p->l);
}

/**
 * Parse a function (header). This covers the optional void marker, the name,
 * and the parameter list. It inserts the function into the program, makes it
 * the function that the parser is working on, and starts its body. The
 * opening brace itself is not consumed here.
 * @param p  The parser.
 */
static void
bc_parse_func(BcParse* p)
{
	bool comma = false, voidfn;
	uint16_t flags;
	size_t idx;

	bc_lex_next(&p->l);

	// Must have a name.
	if (BC_ERR(p->l.t != BC_LEX_NAME)) bc_parse_err(p, BC_ERR_PARSE_FUNC);

	// If the name is "void", and POSIX is not on, mark as void.
	voidfn = (!BC_IS_POSIX && p->l.t == BC_LEX_NAME &&
	          !strcmp(p->l.str.v, "void"));

	// We can safely do this because the expected token should not overwrite the
	// function name.
	bc_lex_next(&p->l);

	// If we *don't* have another name, then void is the name of the function.
	voidfn = (voidfn && p->l.t == BC_LEX_NAME);

	// With a void function, allow POSIX to complain and get a new token.
	if (voidfn)
	{
		bc_parse_err(p, BC_ERR_POSIX_VOID);

		// We can safely do this because the expected token should not overwrite
		// the function name.
		bc_lex_next(&p->l);
	}

	// Must have a left paren.
	if (BC_ERR(p->l.t != BC_LEX_LPAREN)) bc_parse_err(p, BC_ERR_PARSE_FUNC);

	// Make sure the functions map and vector are synchronized.
	assert(p->prog->fns.len == p->prog->fn_map.len);

	// Insert the function by name into the map and vector.
	idx = bc_program_insertFunc(p->prog, p->l.str.v);

	// Make sure the insert worked.
	assert(idx);

	// Update the function pointer and stuff in the parser and set its void.
	bc_parse_updateFunc(p, idx);
	p->func->voidfn = voidfn;

	bc_lex_next(&p->l);

	// While we do not have a right paren, we are still parsing arguments.
	while (p->l.t != BC_LEX_RPAREN)
	{
		BcType t = BC_TYPE_VAR;

		// If we have an asterisk, we are parsing a reference argument.
		if (p->l.t == BC_LEX_OP_MULTIPLY)
		{
			t = BC_TYPE_REF;
			bc_lex_next(&p->l);

			// Let POSIX complain if necessary.
			bc_parse_err(p, BC_ERR_POSIX_REF);
		}

		// If we don't have a name, the argument will not have a name. Barf.
		if (BC_ERR(p->l.t != BC_LEX_NAME)) bc_parse_err(p, BC_ERR_PARSE_FUNC);

		// Increment the number of parameters.
		p->func->nparams += 1;

		// Copy the string in the lexer so that we can use the lexer again.
		// NOTE(review): this passes p->l.str.len, while the matching copy in
		// bc_parse_auto() passes p->l.str.len - 1 -- confirm that the
		// difference is intended.
		bc_vec_string(&p->buf, p->l.str.len, p->l.str.v);

		bc_lex_next(&p->l);

		// We are parsing an array parameter if this is true.
		if (p->l.t == BC_LEX_LBRACKET)
		{
			// Set the array type, unless we are already parsing a reference.
			if (t == BC_TYPE_VAR) t = BC_TYPE_ARRAY;

			bc_lex_next(&p->l);

			// The brackets *must* be empty.
			if (BC_ERR(p->l.t != BC_LEX_RBRACKET))
			{
				bc_parse_err(p, BC_ERR_PARSE_FUNC);
			}

			bc_lex_next(&p->l);
		}
		// If we did *not* get a bracket, but we are expecting a reference, we
		// have a problem.
		else if (BC_ERR(t == BC_TYPE_REF))
		{
			bc_parse_verr(p, BC_ERR_PARSE_REF_VAR, p->buf.v);
		}

		// Test for comma and get the next token if it exists.
		comma = (p->l.t == BC_LEX_COMMA);
		if (comma) bc_lex_next(&p->l);

		// Insert the parameter into the function.
		bc_func_insert(p->func, p->prog, p->buf.v, t, p->l.line);
	}

	// If we have a comma, but no parameter, barf. This works because comma
	// still holds the value from the last parameter that was parsed.
	if (BC_ERR(comma)) bc_parse_err(p, BC_ERR_PARSE_FUNC);

	// Start the body.
	flags = BC_PARSE_FLAG_FUNC | BC_PARSE_FLAG_FUNC_INNER;
	bc_parse_startBody(p, flags);

	bc_lex_next(&p->l);

	// POSIX requires that a brace be on the same line as the function header.
	// If we don't have a brace, let POSIX throw an error.
	if (p->l.t != BC_LEX_LBRACE) bc_parse_err(p, BC_ERR_POSIX_BRACE);
}

/**
 * Parse an auto list. The list must have at least one item, every item is a
 * name that may be followed by empty brackets (which makes it an array), and
 * the list must be the only thing in its statement.
 * @param p  The parser.
 */
static void
bc_parse_auto(BcParse* p)
{
	bool comma, one;

	// Error if the auto keyword appeared in the wrong place.
	if (BC_ERR(!p->auto_part)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
	bc_lex_next(&p->l);

	// Clearing auto_part here means a second auto list will be rejected by
	// the check above.
	p->auto_part = comma = false;

	// We need at least one variable or array.
	one = (p->l.t == BC_LEX_NAME);

	// While we have a variable or array.
	while (p->l.t == BC_LEX_NAME)
	{
		BcType t;

		// Copy the name from the lexer, so we can use it again.
		bc_vec_string(&p->buf, p->l.str.len - 1, p->l.str.v);

		bc_lex_next(&p->l);

		// If we are parsing an array...
		if (p->l.t == BC_LEX_LBRACKET)
		{
			t = BC_TYPE_ARRAY;

			bc_lex_next(&p->l);

			// The brackets *must* be empty.
			if (BC_ERR(p->l.t != BC_LEX_RBRACKET))
			{
				bc_parse_err(p, BC_ERR_PARSE_FUNC);
			}

			bc_lex_next(&p->l);
		}
		else t = BC_TYPE_VAR;

		// Test for comma and get the next token if it exists.
		comma = (p->l.t == BC_LEX_COMMA);
		if (comma) bc_lex_next(&p->l);

		// Insert the auto into the function.
		bc_func_insert(p->func, p->prog, p->buf.v, t, p->l.line);
	}

	// If we have a comma, but no auto, barf.
if (BC_ERR(comma)) bc_parse_err(p, BC_ERR_PARSE_FUNC);

	// If we don't have any variables or arrays, barf.
	if (BC_ERR(!one)) bc_parse_err(p, BC_ERR_PARSE_NO_AUTO);

	// The auto statement should be all that's in the statement.
	if (BC_ERR(!bc_parse_isDelimiter(p))) bc_parse_err(p, BC_ERR_PARSE_TOKEN);
}

/**
 * Parses a body. For a function, this only handles the optional auto list at
 * the top of the body. For anything else, it parses one statement and, if the
 * body had no braces, ends the body right after that statement.
 * @param p      The parser.
 * @param brace  True if a brace was encountered, false otherwise.
 */
static void
bc_parse_body(BcParse* p, bool brace)
{
	uint16_t* flag_ptr = BC_PARSE_TOP_FLAG_PTR(p);

	assert(flag_ptr != NULL);
	assert(p->flags.len >= 2);

	// The body flag is for when we expect a body. We got a body, so clear the
	// flag.
	*flag_ptr &= ~(BC_PARSE_FLAG_BODY);

	// If we are inside a function, that means we just barely entered it, and
	// we can expect an auto list.
	if (*flag_ptr & BC_PARSE_FLAG_FUNC_INNER)
	{
		// We *must* have a brace in this case.
		if (BC_ERR(!brace)) bc_parse_err(p, BC_ERR_PARSE_TOKEN);

		// If the auto keyword is not the current token, an auto list may still
		// come later (e.g., after a newline), so leave the door open.
		p->auto_part = (p->l.t != BC_LEX_KW_AUTO);

		if (!p->auto_part)
		{
			// Make sure this is true to not get a parse error.
			p->auto_part = true;

			// Since we already have the auto keyword, parse.
			bc_parse_auto(p);
		}

		// Eat a newline.
		if (p->l.t == BC_LEX_NLINE) bc_lex_next(&p->l);
	}
	else
	{
		// This is the easy part.
		size_t len = p->flags.len;

		assert(*flag_ptr);

		// Parse a statement.
		bc_parse_stmt(p);

		// This is a very important condition to get right. If there is no
		// brace, and no body flag, and the flags len hasn't shrunk, then we
		// have a body that was not delimited by braces, so we need to end it
		// now, after just one statement.
		if (!brace && !BC_PARSE_BODY(p) && len <= p->flags.len)
		{
			bc_parse_endBody(p, false);
		}
	}
}

/**
 * Parses a statement. This is the entry point for just about everything, except
 * function definitions. Several cases return early so that the next call
 * starts with a clean slate; everything else goes through the switch on the
 * token type and the delimiter check after it.
 * @param p  The parser.
 */
static void
bc_parse_stmt(BcParse* p)
{
	size_t len;
	uint16_t flags;
	BcLexType type = p->l.t;

	// Eat newline.
	if (type == BC_LEX_NLINE)
	{
		bc_lex_next(&p->l);
		return;
	}

	// Eat auto list.
	if (type == BC_LEX_KW_AUTO)
	{
		bc_parse_auto(p);
		return;
	}

	// If we reach this point, no auto list is allowed.
	p->auto_part = false;

	// Everything but an else needs to be taken care of here, but else is
	// special.
	if (type != BC_LEX_KW_ELSE)
	{
		// After an if, no else found.
		if (BC_PARSE_IF_END(p))
		{
			// Clear the expectation for else, end body, and return. Returning
			// gives us a clean slate for parsing again.
			bc_parse_noElse(p);
			if (p->flags.len > 1 && !BC_PARSE_BRACE(p))
			{
				bc_parse_endBody(p, false);
			}

			return;
		}
		// With a left brace, we are parsing a body.
		else if (type == BC_LEX_LBRACE)
		{
			// We need to start a body if we are not expecting one yet.
			if (!BC_PARSE_BODY(p))
			{
				bc_parse_startBody(p, BC_PARSE_FLAG_BRACE);
				bc_lex_next(&p->l);
			}
			// If we *are* expecting a body, that body should get a brace. This
			// takes care of braces being on a different line than if and loop
			// headers.
			else
			{
				*(BC_PARSE_TOP_FLAG_PTR(p)) |= BC_PARSE_FLAG_BRACE;
				bc_lex_next(&p->l);
				bc_parse_body(p, true);
			}

			// If we have reached this point, we need to return for a clean
			// slate.
return;
		}
		// This happens when we are expecting a body and get a single statement,
		// i.e., a body with no braces surrounding it. Returns after for a clean
		// slate.
		else if (BC_PARSE_BODY(p) && !BC_PARSE_BRACE(p))
		{
			bc_parse_body(p, false);
			return;
		}
	}

	// Snapshot the flag stack. The check after the switch compares against
	// these to find out whether the statement changed the stack.
	len = p->flags.len;
	flags = BC_PARSE_TOP_FLAG(p);

	switch (type)
	{
		// All of these are valid for expressions.
		case BC_LEX_OP_INC:
		case BC_LEX_OP_DEC:
		case BC_LEX_OP_MINUS:
		case BC_LEX_OP_BOOL_NOT:
		case BC_LEX_LPAREN:
		case BC_LEX_NAME:
		case BC_LEX_NUMBER:
		case BC_LEX_KW_IBASE:
		case BC_LEX_KW_LAST:
		case BC_LEX_KW_LENGTH:
		case BC_LEX_KW_OBASE:
		case BC_LEX_KW_SCALE:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_SEED:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_SQRT:
		case BC_LEX_KW_ABS:
		case BC_LEX_KW_IS_NUMBER:
		case BC_LEX_KW_IS_STRING:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_IRAND:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_ASCIIFY:
		case BC_LEX_KW_MODEXP:
		case BC_LEX_KW_DIVMOD:
		case BC_LEX_KW_READ:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_RAND:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_MAXIBASE:
		case BC_LEX_KW_MAXOBASE:
		case BC_LEX_KW_MAXSCALE:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_MAXRAND:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_KW_LINE_LENGTH:
		case BC_LEX_KW_GLOBAL_STACKS:
		case BC_LEX_KW_LEADING_ZERO:
		{
			bc_parse_expr_status(p, BC_PARSE_PRINT, bc_parse_next_expr);
			break;
		}

		case BC_LEX_KW_ELSE:
		{
			bc_parse_else(p);
			break;
		}

		// Just eat.
		case BC_LEX_SCOLON:
		{
			// Do nothing.
			break;
		}

		case BC_LEX_RBRACE:
		{
			bc_parse_endBody(p, true);
			break;
		}

		case BC_LEX_STR:
		{
			bc_parse_str(p, BC_INST_PRINT_STR);
			break;
		}

		case BC_LEX_KW_BREAK:
		case BC_LEX_KW_CONTINUE:
		{
			bc_parse_loopExit(p, p->l.t);
			break;
		}

		case BC_LEX_KW_FOR:
		{
			bc_parse_for(p);
			break;
		}

		case BC_LEX_KW_HALT:
		{
			bc_parse_push(p, BC_INST_HALT);
			bc_lex_next(&p->l);
			break;
		}

		case BC_LEX_KW_IF:
		{
			bc_parse_if(p);
			break;
		}

		case BC_LEX_KW_LIMITS:
		{
			// `limits` is a compile-time command, so execute it right away.
			bc_vm_printf("BC_LONG_BIT = %lu\n", (ulong) BC_LONG_BIT);
			bc_vm_printf("BC_BASE_DIGS = %lu\n", (ulong) BC_BASE_DIGS);
			bc_vm_printf("BC_BASE_POW = %lu\n", (ulong) BC_BASE_POW);
			bc_vm_printf("BC_OVERFLOW_MAX = %lu\n", (ulong) BC_NUM_BIGDIG_MAX);
			bc_vm_printf("\n");
			bc_vm_printf("BC_BASE_MAX = %lu\n", BC_MAX_OBASE);
			bc_vm_printf("BC_DIM_MAX = %lu\n", BC_MAX_DIM);
			bc_vm_printf("BC_SCALE_MAX = %lu\n", BC_MAX_SCALE);
			bc_vm_printf("BC_STRING_MAX = %lu\n", BC_MAX_STRING);
			bc_vm_printf("BC_NAME_MAX = %lu\n", BC_MAX_NAME);
			bc_vm_printf("BC_NUM_MAX = %lu\n", BC_MAX_NUM);
#if BC_ENABLE_EXTRA_MATH
			bc_vm_printf("BC_RAND_MAX = %lu\n", BC_MAX_RAND);
#endif // BC_ENABLE_EXTRA_MATH
			bc_vm_printf("MAX Exponent = %lu\n", BC_MAX_EXP);
			bc_vm_printf("Number of vars = %lu\n", BC_MAX_VARS);

			bc_lex_next(&p->l);

			break;
		}

		case BC_LEX_KW_STREAM:
		case BC_LEX_KW_PRINT:
		{
			bc_parse_print(p, type);
			break;
		}

		case BC_LEX_KW_QUIT:
		{
			// Quit is a compile-time command. We don't exit directly, so the vm
			// can clean up.
			vm->status = BC_STATUS_QUIT;
			BC_JMP;
			break;
		}

		case BC_LEX_KW_RETURN:
		{
			bc_parse_return(p);
			break;
		}

		case BC_LEX_KW_WHILE:
		{
			bc_parse_while(p);
			break;
		}

		// None of the tokens below can start a statement, so all of them are
		// errors.
		case BC_LEX_EOF:
		case BC_LEX_INVALID:
		case BC_LEX_NEG:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_OP_TRUNC:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_OP_POWER:
		case BC_LEX_OP_MULTIPLY:
		case BC_LEX_OP_DIVIDE:
		case BC_LEX_OP_MODULUS:
		case BC_LEX_OP_PLUS:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_OP_PLACES:
		case BC_LEX_OP_LSHIFT:
		case BC_LEX_OP_RSHIFT:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_OP_REL_EQ:
		case BC_LEX_OP_REL_LE:
		case BC_LEX_OP_REL_GE:
		case BC_LEX_OP_REL_NE:
		case BC_LEX_OP_REL_LT:
		case BC_LEX_OP_REL_GT:
		case BC_LEX_OP_BOOL_OR:
		case BC_LEX_OP_BOOL_AND:
		case BC_LEX_OP_ASSIGN_POWER:
		case BC_LEX_OP_ASSIGN_MULTIPLY:
		case BC_LEX_OP_ASSIGN_DIVIDE:
		case BC_LEX_OP_ASSIGN_MODULUS:
		case BC_LEX_OP_ASSIGN_PLUS:
		case BC_LEX_OP_ASSIGN_MINUS:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_OP_ASSIGN_PLACES:
		case BC_LEX_OP_ASSIGN_LSHIFT:
		case BC_LEX_OP_ASSIGN_RSHIFT:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_OP_ASSIGN:
		case BC_LEX_NLINE:
		case BC_LEX_WHITESPACE:
		case BC_LEX_RPAREN:
		case BC_LEX_LBRACKET:
		case BC_LEX_COMMA:
		case BC_LEX_RBRACKET:
		case BC_LEX_LBRACE:
		case BC_LEX_KW_AUTO:
		case BC_LEX_KW_DEFINE:
#if DC_ENABLED
		case BC_LEX_EXTENDED_REGISTERS:
		case BC_LEX_EQ_NO_REG:
		case BC_LEX_COLON:
		case BC_LEX_EXECUTE:
		case BC_LEX_PRINT_STACK:
		case BC_LEX_CLEAR_STACK:
		case BC_LEX_REG_STACK_LEVEL:
		case BC_LEX_STACK_LEVEL:
		case BC_LEX_DUPLICATE:
		case BC_LEX_SWAP:
		case BC_LEX_POP:
		case BC_LEX_STORE_IBASE:
		case BC_LEX_STORE_OBASE:
		case BC_LEX_STORE_SCALE:
#if BC_ENABLE_EXTRA_MATH
		case BC_LEX_STORE_SEED:
#endif // BC_ENABLE_EXTRA_MATH
		case BC_LEX_LOAD:
		case BC_LEX_LOAD_POP:
		case BC_LEX_STORE_PUSH:
		case BC_LEX_PRINT_POP:
		case BC_LEX_NQUIT:
		case BC_LEX_EXEC_STACK_LENGTH:
		case BC_LEX_SCALE_FACTOR:
		case BC_LEX_ARRAY_LENGTH:
#endif // DC_ENABLED
		{
			bc_parse_err(p, BC_ERR_PARSE_TOKEN);
		}
	}

	// If the flags did not change, we expect a delimiter.
	if (len == p->flags.len && flags == BC_PARSE_TOP_FLAG(p))
	{
		if (BC_ERR(!bc_parse_isDelimiter(p)))
		{
			bc_parse_err(p, BC_ERR_PARSE_TOKEN);
		}
	}

	// Make sure semicolons are eaten.
	while (p->l.t == BC_LEX_SCOLON || p->l.t == BC_LEX_NLINE)
	{
		bc_lex_next(&p->l);
	}

	// POSIX's grammar does not allow a function definition after a semicolon
	// without a newline, so check specifically for that case and error if
	// the POSIX standard flag is set.
	if (p->l.last == BC_LEX_SCOLON && p->l.t == BC_LEX_KW_DEFINE && BC_IS_POSIX)
	{
		bc_parse_err(p, BC_ERR_POSIX_FUNC_AFTER_SEMICOLON);
	}
}

/**
 * Parses one top-level item at the parser's current token. That is either a
 * function header, if the token is the define keyword, or a statement. An EOF
 * token is an error. If an error status (other than quit) or a signal is
 * pending when this is done, the parser is reset.
 * @param p  The parser.
 */
void
bc_parse_parse(BcParse* p)
{
	assert(p);

	BC_SETJMP_LOCKED(vm, exit);

	// We should not let an EOF get here unless some partial parse was not
	// completed, in which case, it's the user's fault.
	if (BC_ERR(p->l.t == BC_LEX_EOF)) bc_parse_err(p, BC_ERR_PARSE_EOF);

	// Functions need special parsing.
	else if (p->l.t == BC_LEX_KW_DEFINE)
	{
		// Try to close whatever if statements and loops are still open before
		// the definition; if that was not enough, the define is misplaced.
		if (BC_ERR(BC_PARSE_NO_EXEC(p)))
		{
			bc_parse_endif(p);
			if (BC_ERR(BC_PARSE_NO_EXEC(p)))
			{
				bc_parse_err(p, BC_ERR_PARSE_TOKEN);
			}
		}
		bc_parse_func(p);
	}

	// Otherwise, parse a normal statement.
	else bc_parse_stmt(p);

exit:

	// We need to reset on error.
	if (BC_ERR(((vm->status && vm->status != BC_STATUS_QUIT) || vm->sig != 0)))
	{
		bc_parse_reset(p);
	}

	BC_LONGJMP_CONT(vm);
	BC_SIG_MAYLOCK;
}

/**
 * Parse an expression. This is the actual implementation of the Shunting-Yard
 * Algorithm.
 * @param p      The parser.
 * @param flags  The flags for what is valid in the expression.
 * @param next   A set of tokens for what is valid *after* the expression.
 * @return       A parse status. In some places, an empty expression is an
 *               error, and sometimes, it is required. This allows this function
 *               to tell the caller if the expression was empty and let the
 *               caller handle it.
 */
static BcParseStatus
bc_parse_expr_err(BcParse* p, uint8_t flags, BcParseNext next)
{
	BcInst prev = BC_INST_PRINT;
	uchar inst = BC_INST_INVALID;
	BcLexType top, t;
	size_t nexprs, ops_bgn;
	uint32_t i, nparens, nrelops;
	bool pfirst, rprn, array_last, done, get_token, assign;
	bool bin_last, incdec, can_assign;

	// One of these *must* be true.
	assert(!(flags & BC_PARSE_PRINT) || !(flags & BC_PARSE_NEEDVAL));

	// These are set very carefully. In fact, controlling the values of these
	// locals is the biggest part of making this work. ops_bgn especially is
	// important because it marks where the operator stack begins for *this*
	// invocation of this function. That's because bc_parse_expr_err() is
	// recursive (the Shunting-Yard Algorithm is most easily expressed
	// recursively when parsing subexpressions), and each invocation needs to
	// know where to stop.
	//
	// - nparens is the number of left parens without matches.
	// - nrelops is the number of relational operators that appear in the expr.
	// - nexprs is the number of unused expressions.
	// - rprn is a right paren encountered last.
	// - array_last is an array item encountered last.
2024 // - done means the expression has been fully parsed. 2025 // - get_token is true when a token is needed at the end of an iteration. 2026 // - assign is true when an assignment statement was parsed last. 2027 // - incdec is true when the previous operator was an inc or dec operator. 2028 // - can_assign is true when an assignemnt is valid. 2029 // - bin_last is true when the previous instruction was a binary operator. 2030 t = p->l.t; 2031 pfirst = (p->l.t == BC_LEX_LPAREN); 2032 nparens = nrelops = 0; 2033 nexprs = 0; 2034 ops_bgn = p->ops.len; 2035 rprn = array_last = done = get_token = assign = incdec = can_assign = false; 2036 bin_last = true; 2037 2038 // We want to eat newlines if newlines are not a valid ending token. 2039 // This is for spacing in things like for loop headers. 2040 if (!(flags & BC_PARSE_NOREAD)) 2041 { 2042 while ((t = p->l.t) == BC_LEX_NLINE) 2043 { 2044 bc_lex_next(&p->l); 2045 } 2046 } 2047 2048 // This is the Shunting-Yard algorithm loop. 2049 for (; !done && BC_PARSE_EXPR(t); t = p->l.t) 2050 { 2051 // Make sure an array expression is not mixed with any others. However, 2052 // a right parenthesis may end the expression, so we will need to take 2053 // care of that right there. 2054 if (BC_ERR(array_last && t != BC_LEX_RPAREN)) 2055 { 2056 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2057 } 2058 2059 switch (t) 2060 { 2061 case BC_LEX_OP_INC: 2062 case BC_LEX_OP_DEC: 2063 { 2064 // These operators can only be used with items that can be 2065 // assigned to. 2066 if (BC_ERR(incdec)) bc_parse_err(p, BC_ERR_PARSE_ASSIGN); 2067 2068 bc_parse_incdec(p, &prev, &can_assign, &nexprs, flags); 2069 2070 rprn = get_token = bin_last = false; 2071 incdec = true; 2072 flags &= ~(BC_PARSE_ARRAY); 2073 2074 break; 2075 } 2076 2077 #if BC_ENABLE_EXTRA_MATH 2078 case BC_LEX_OP_TRUNC: 2079 { 2080 // The previous token must have been a leaf expression, or the 2081 // operator is in the wrong place. 
2082 if (BC_ERR(!BC_PARSE_LEAF(prev, bin_last, rprn))) 2083 { 2084 bc_parse_err(p, BC_ERR_PARSE_TOKEN); 2085 } 2086 2087 // I can just add the instruction because 2088 // negative will already be taken care of. 2089 bc_parse_push(p, BC_INST_TRUNC); 2090 2091 rprn = can_assign = incdec = false; 2092 get_token = true; 2093 flags &= ~(BC_PARSE_ARRAY); 2094 2095 break; 2096 } 2097 #endif // BC_ENABLE_EXTRA_MATH 2098 2099 case BC_LEX_OP_MINUS: 2100 { 2101 bc_parse_minus(p, &prev, ops_bgn, rprn, bin_last, &nexprs); 2102 2103 rprn = get_token = can_assign = false; 2104 2105 // This is true if it was a binary operator last. 2106 bin_last = (prev == BC_INST_MINUS); 2107 if (bin_last) incdec = false; 2108 2109 flags &= ~(BC_PARSE_ARRAY); 2110 2111 break; 2112 } 2113 2114 // All of this group, including the fallthrough, is to parse binary 2115 // operators. 2116 case BC_LEX_OP_ASSIGN_POWER: 2117 case BC_LEX_OP_ASSIGN_MULTIPLY: 2118 case BC_LEX_OP_ASSIGN_DIVIDE: 2119 case BC_LEX_OP_ASSIGN_MODULUS: 2120 case BC_LEX_OP_ASSIGN_PLUS: 2121 case BC_LEX_OP_ASSIGN_MINUS: 2122 #if BC_ENABLE_EXTRA_MATH 2123 case BC_LEX_OP_ASSIGN_PLACES: 2124 case BC_LEX_OP_ASSIGN_LSHIFT: 2125 case BC_LEX_OP_ASSIGN_RSHIFT: 2126 #endif // BC_ENABLE_EXTRA_MATH 2127 case BC_LEX_OP_ASSIGN: 2128 { 2129 // We need to make sure the assignment is valid. 2130 if (!BC_PARSE_INST_VAR(prev)) 2131 { 2132 bc_parse_err(p, BC_ERR_PARSE_ASSIGN); 2133 } 2134 2135 // Fallthrough. 
2136 BC_FALLTHROUGH 2137 } 2138 2139 case BC_LEX_OP_POWER: 2140 case BC_LEX_OP_MULTIPLY: 2141 case BC_LEX_OP_DIVIDE: 2142 case BC_LEX_OP_MODULUS: 2143 case BC_LEX_OP_PLUS: 2144 #if BC_ENABLE_EXTRA_MATH 2145 case BC_LEX_OP_PLACES: 2146 case BC_LEX_OP_LSHIFT: 2147 case BC_LEX_OP_RSHIFT: 2148 #endif // BC_ENABLE_EXTRA_MATH 2149 case BC_LEX_OP_REL_EQ: 2150 case BC_LEX_OP_REL_LE: 2151 case BC_LEX_OP_REL_GE: 2152 case BC_LEX_OP_REL_NE: 2153 case BC_LEX_OP_REL_LT: 2154 case BC_LEX_OP_REL_GT: 2155 case BC_LEX_OP_BOOL_NOT: 2156 case BC_LEX_OP_BOOL_OR: 2157 case BC_LEX_OP_BOOL_AND: 2158 { 2159 // This is true if the operator if the token is a prefix 2160 // operator. This is only for boolean not. 2161 if (BC_PARSE_OP_PREFIX(t)) 2162 { 2163 // Prefix operators are only allowed after binary operators 2164 // or prefix operators. 2165 if (BC_ERR(!bin_last && !BC_PARSE_OP_PREFIX(p->l.last))) 2166 { 2167 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2168 } 2169 } 2170 // If we execute the else, that means we have a binary operator. 2171 // If the previous operator was a prefix or a binary operator, 2172 // then a binary operator is not allowed. 2173 else if (BC_ERR(BC_PARSE_PREV_PREFIX(prev) || bin_last)) 2174 { 2175 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2176 } 2177 2178 nrelops += (t >= BC_LEX_OP_REL_EQ && t <= BC_LEX_OP_REL_GT); 2179 prev = BC_PARSE_TOKEN_INST(t); 2180 2181 bc_parse_operator(p, t, ops_bgn, &nexprs); 2182 2183 rprn = incdec = can_assign = false; 2184 get_token = true; 2185 bin_last = !BC_PARSE_OP_PREFIX(t); 2186 flags &= ~(BC_PARSE_ARRAY); 2187 2188 break; 2189 } 2190 2191 case BC_LEX_LPAREN: 2192 { 2193 // A left paren is *not* allowed right after a leaf expr. 2194 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2195 { 2196 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2197 } 2198 2199 nparens += 1; 2200 rprn = incdec = can_assign = false; 2201 get_token = true; 2202 2203 // Push the paren onto the operator stack. 
2204 bc_vec_push(&p->ops, &t); 2205 2206 break; 2207 } 2208 2209 case BC_LEX_RPAREN: 2210 { 2211 // This needs to be a status. The error is handled in 2212 // bc_parse_expr_status(). 2213 if (BC_ERR(p->l.last == BC_LEX_LPAREN)) 2214 { 2215 return BC_PARSE_STATUS_EMPTY_EXPR; 2216 } 2217 2218 // The right paren must not come after a prefix or binary 2219 // operator. 2220 if (BC_ERR(bin_last || BC_PARSE_PREV_PREFIX(prev))) 2221 { 2222 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2223 } 2224 2225 // If there are no parens left, we are done, but we need another 2226 // token. 2227 if (!nparens) 2228 { 2229 done = true; 2230 get_token = false; 2231 break; 2232 } 2233 2234 // Now that we know the right paren has not ended the 2235 // expression, make sure an array expression is not mixed with 2236 // any others. 2237 if (BC_ERR(array_last)) 2238 { 2239 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2240 } 2241 2242 nparens -= 1; 2243 rprn = true; 2244 get_token = bin_last = incdec = false; 2245 2246 bc_parse_rightParen(p, &nexprs); 2247 2248 break; 2249 } 2250 2251 case BC_LEX_STR: 2252 { 2253 // POSIX only allows strings alone. 2254 if (BC_IS_POSIX) bc_parse_err(p, BC_ERR_POSIX_EXPR_STRING); 2255 2256 // A string is a leaf and cannot come right after a leaf. 2257 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2258 { 2259 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2260 } 2261 2262 bc_parse_addString(p); 2263 2264 get_token = true; 2265 bin_last = rprn = false; 2266 nexprs += 1; 2267 2268 break; 2269 } 2270 2271 case BC_LEX_NAME: 2272 { 2273 // A name is a leaf and cannot come right after a leaf. 
2274 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2275 { 2276 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2277 } 2278 2279 get_token = bin_last = false; 2280 2281 bc_parse_name(p, &prev, &can_assign, flags & ~BC_PARSE_NOCALL); 2282 2283 rprn = (prev == BC_INST_CALL); 2284 array_last = (prev == BC_INST_ARRAY); 2285 nexprs += 1; 2286 flags &= ~(BC_PARSE_ARRAY); 2287 2288 break; 2289 } 2290 2291 case BC_LEX_NUMBER: 2292 { 2293 // A number is a leaf and cannot come right after a leaf. 2294 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2295 { 2296 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2297 } 2298 2299 // The number instruction is pushed in here. 2300 bc_parse_number(p); 2301 2302 nexprs += 1; 2303 prev = BC_INST_NUM; 2304 get_token = true; 2305 rprn = bin_last = can_assign = false; 2306 flags &= ~(BC_PARSE_ARRAY); 2307 2308 break; 2309 } 2310 2311 case BC_LEX_KW_IBASE: 2312 case BC_LEX_KW_LAST: 2313 case BC_LEX_KW_OBASE: 2314 #if BC_ENABLE_EXTRA_MATH 2315 case BC_LEX_KW_SEED: 2316 #endif // BC_ENABLE_EXTRA_MATH 2317 { 2318 // All of these are leaves and cannot come right after a leaf. 2319 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2320 { 2321 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2322 } 2323 2324 prev = t - BC_LEX_KW_LAST + BC_INST_LAST; 2325 bc_parse_push(p, prev); 2326 2327 get_token = can_assign = true; 2328 rprn = bin_last = false; 2329 nexprs += 1; 2330 flags &= ~(BC_PARSE_ARRAY); 2331 2332 break; 2333 } 2334 2335 case BC_LEX_KW_LENGTH: 2336 case BC_LEX_KW_SQRT: 2337 case BC_LEX_KW_ABS: 2338 case BC_LEX_KW_IS_NUMBER: 2339 case BC_LEX_KW_IS_STRING: 2340 #if BC_ENABLE_EXTRA_MATH 2341 case BC_LEX_KW_IRAND: 2342 #endif // BC_ENABLE_EXTRA_MATH 2343 case BC_LEX_KW_ASCIIFY: 2344 { 2345 // All of these are leaves and cannot come right after a leaf. 
2346 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2347 { 2348 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2349 } 2350 2351 bc_parse_builtin(p, t, flags, &prev); 2352 2353 rprn = get_token = bin_last = incdec = can_assign = false; 2354 nexprs += 1; 2355 flags &= ~(BC_PARSE_ARRAY); 2356 2357 break; 2358 } 2359 2360 case BC_LEX_KW_READ: 2361 #if BC_ENABLE_EXTRA_MATH 2362 case BC_LEX_KW_RAND: 2363 #endif // BC_ENABLE_EXTRA_MATH 2364 case BC_LEX_KW_MAXIBASE: 2365 case BC_LEX_KW_MAXOBASE: 2366 case BC_LEX_KW_MAXSCALE: 2367 #if BC_ENABLE_EXTRA_MATH 2368 case BC_LEX_KW_MAXRAND: 2369 #endif // BC_ENABLE_EXTRA_MATH 2370 case BC_LEX_KW_LINE_LENGTH: 2371 case BC_LEX_KW_GLOBAL_STACKS: 2372 case BC_LEX_KW_LEADING_ZERO: 2373 { 2374 // All of these are leaves and cannot come right after a leaf. 2375 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2376 { 2377 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2378 } 2379 2380 // Error if we have read and it's not allowed. 2381 else if (t == BC_LEX_KW_READ && BC_ERR(flags & BC_PARSE_NOREAD)) 2382 { 2383 bc_parse_err(p, BC_ERR_EXEC_REC_READ); 2384 } 2385 2386 prev = t - BC_LEX_KW_READ + BC_INST_READ; 2387 bc_parse_noArgBuiltin(p, prev); 2388 2389 rprn = get_token = bin_last = incdec = can_assign = false; 2390 nexprs += 1; 2391 flags &= ~(BC_PARSE_ARRAY); 2392 2393 break; 2394 } 2395 2396 case BC_LEX_KW_SCALE: 2397 { 2398 // This is a leaf and cannot come right after a leaf. 2399 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2400 { 2401 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2402 } 2403 2404 // Scale needs special work because it can be a variable *or* a 2405 // function. 2406 bc_parse_scale(p, &prev, &can_assign, flags); 2407 2408 rprn = get_token = bin_last = false; 2409 nexprs += 1; 2410 flags &= ~(BC_PARSE_ARRAY); 2411 2412 break; 2413 } 2414 2415 case BC_LEX_KW_MODEXP: 2416 case BC_LEX_KW_DIVMOD: 2417 { 2418 // This is a leaf and cannot come right after a leaf. 
2419 if (BC_ERR(BC_PARSE_LEAF(prev, bin_last, rprn))) 2420 { 2421 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2422 } 2423 2424 bc_parse_builtin3(p, t, flags, &prev); 2425 2426 rprn = get_token = bin_last = incdec = can_assign = false; 2427 nexprs += 1; 2428 flags &= ~(BC_PARSE_ARRAY); 2429 2430 break; 2431 } 2432 2433 case BC_LEX_EOF: 2434 case BC_LEX_INVALID: 2435 case BC_LEX_NEG: 2436 case BC_LEX_NLINE: 2437 case BC_LEX_WHITESPACE: 2438 case BC_LEX_LBRACKET: 2439 case BC_LEX_COMMA: 2440 case BC_LEX_RBRACKET: 2441 case BC_LEX_LBRACE: 2442 case BC_LEX_SCOLON: 2443 case BC_LEX_RBRACE: 2444 case BC_LEX_KW_AUTO: 2445 case BC_LEX_KW_BREAK: 2446 case BC_LEX_KW_CONTINUE: 2447 case BC_LEX_KW_DEFINE: 2448 case BC_LEX_KW_FOR: 2449 case BC_LEX_KW_IF: 2450 case BC_LEX_KW_LIMITS: 2451 case BC_LEX_KW_RETURN: 2452 case BC_LEX_KW_WHILE: 2453 case BC_LEX_KW_HALT: 2454 case BC_LEX_KW_PRINT: 2455 case BC_LEX_KW_QUIT: 2456 case BC_LEX_KW_STREAM: 2457 case BC_LEX_KW_ELSE: 2458 #if DC_ENABLED 2459 case BC_LEX_EXTENDED_REGISTERS: 2460 case BC_LEX_EQ_NO_REG: 2461 case BC_LEX_COLON: 2462 case BC_LEX_EXECUTE: 2463 case BC_LEX_PRINT_STACK: 2464 case BC_LEX_CLEAR_STACK: 2465 case BC_LEX_REG_STACK_LEVEL: 2466 case BC_LEX_STACK_LEVEL: 2467 case BC_LEX_DUPLICATE: 2468 case BC_LEX_SWAP: 2469 case BC_LEX_POP: 2470 case BC_LEX_STORE_IBASE: 2471 case BC_LEX_STORE_OBASE: 2472 case BC_LEX_STORE_SCALE: 2473 #if BC_ENABLE_EXTRA_MATH 2474 case BC_LEX_STORE_SEED: 2475 #endif // BC_ENABLE_EXTRA_MATH 2476 case BC_LEX_LOAD: 2477 case BC_LEX_LOAD_POP: 2478 case BC_LEX_STORE_PUSH: 2479 case BC_LEX_PRINT_POP: 2480 case BC_LEX_NQUIT: 2481 case BC_LEX_EXEC_STACK_LENGTH: 2482 case BC_LEX_SCALE_FACTOR: 2483 case BC_LEX_ARRAY_LENGTH: 2484 #endif // DC_ENABLED 2485 { 2486 #if BC_DEBUG 2487 // We should never get here, even in debug builds. 
2488 bc_parse_err(p, BC_ERR_PARSE_TOKEN); 2489 break; 2490 #endif // BC_DEBUG 2491 } 2492 } 2493 2494 if (get_token) bc_lex_next(&p->l); 2495 } 2496 2497 // Now that we have parsed the expression, we need to empty the operator 2498 // stack. 2499 while (p->ops.len > ops_bgn) 2500 { 2501 top = BC_PARSE_TOP_OP(p); 2502 assign = top >= BC_LEX_OP_ASSIGN_POWER && top <= BC_LEX_OP_ASSIGN; 2503 2504 // There should not be *any* parens on the stack anymore. 2505 if (BC_ERR(top == BC_LEX_LPAREN || top == BC_LEX_RPAREN)) 2506 { 2507 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2508 } 2509 2510 bc_parse_push(p, BC_PARSE_TOKEN_INST(top)); 2511 2512 // Adjust the number of unused expressions. 2513 nexprs -= !BC_PARSE_OP_PREFIX(top); 2514 bc_vec_pop(&p->ops); 2515 2516 incdec = false; 2517 } 2518 2519 // There must be only one expression at the top. 2520 if (BC_ERR(nexprs != 1)) bc_parse_err(p, BC_ERR_PARSE_EXPR); 2521 2522 // Check that the next token is correct. 2523 for (i = 0; i < next.len && t != next.tokens[i]; ++i) 2524 { 2525 continue; 2526 } 2527 if (BC_ERR(i == next.len && !bc_parse_isDelimiter(p))) 2528 { 2529 bc_parse_err(p, BC_ERR_PARSE_EXPR); 2530 } 2531 2532 // Check that POSIX would be happy with the number of relational operators. 2533 if (!(flags & BC_PARSE_REL) && nrelops) 2534 { 2535 bc_parse_err(p, BC_ERR_POSIX_REL_POS); 2536 } 2537 else if ((flags & BC_PARSE_REL) && nrelops > 1) 2538 { 2539 bc_parse_err(p, BC_ERR_POSIX_MULTIREL); 2540 } 2541 2542 // If this is true, then we might be in a situation where we don't print. 2543 // We would want to have the increment/decrement operator not make an extra 2544 // copy if it's not necessary. 2545 if (!(flags & BC_PARSE_NEEDVAL) && !pfirst) 2546 { 2547 // We have the easy case if the last operator was an assignment 2548 // operator. 
2549 if (assign) 2550 { 2551 inst = *((uchar*) bc_vec_top(&p->func->code)); 2552 inst += (BC_INST_ASSIGN_POWER_NO_VAL - BC_INST_ASSIGN_POWER); 2553 incdec = false; 2554 } 2555 // If we have an inc/dec operator and we are *not* printing, implement 2556 // the optimization to get rid of the extra copy. 2557 else if (incdec && !(flags & BC_PARSE_PRINT)) 2558 { 2559 inst = *((uchar*) bc_vec_top(&p->func->code)); 2560 incdec = (inst <= BC_INST_DEC); 2561 inst = BC_INST_ASSIGN_PLUS_NO_VAL + 2562 (inst != BC_INST_INC && inst != BC_INST_ASSIGN_PLUS); 2563 } 2564 2565 // This condition allows us to change the previous assignment 2566 // instruction (which does a copy) for a NO_VAL version, which does not. 2567 // This condition is set if either of the above if statements ends up 2568 // being true. 2569 if (inst >= BC_INST_ASSIGN_POWER_NO_VAL && 2570 inst <= BC_INST_ASSIGN_NO_VAL) 2571 { 2572 // Pop the previous assignment instruction and push a new one. 2573 // Inc/dec needs the extra instruction because it is now a binary 2574 // operator and needs a second operand. 2575 bc_vec_pop(&p->func->code); 2576 if (incdec) bc_parse_push(p, BC_INST_ONE); 2577 bc_parse_push(p, inst); 2578 } 2579 } 2580 2581 // If we might have to print... 2582 if ((flags & BC_PARSE_PRINT)) 2583 { 2584 // With a paren first or the last operator not being an assignment, we 2585 // *do* want to print. 2586 if (pfirst || !assign) bc_parse_push(p, BC_INST_PRINT); 2587 } 2588 // We need to make sure to push a pop instruction for assignment statements 2589 // that will not print. The print will pop, but without it, we need to pop. 2590 else if (!(flags & BC_PARSE_NEEDVAL) && 2591 (inst < BC_INST_ASSIGN_POWER_NO_VAL || 2592 inst > BC_INST_ASSIGN_NO_VAL)) 2593 { 2594 bc_parse_push(p, BC_INST_POP); 2595 } 2596 2597 // We want to eat newlines if newlines are not a valid ending token. 2598 // This is for spacing in things like for loop headers. 
2599 // 2600 // Yes, this is one case where I reuse a variable for a different purpose; 2601 // in this case, incdec being true now means that newlines are not valid. 2602 for (incdec = true, i = 0; i < next.len && incdec; ++i) 2603 { 2604 incdec = (next.tokens[i] != BC_LEX_NLINE); 2605 } 2606 if (incdec) 2607 { 2608 while (p->l.t == BC_LEX_NLINE) 2609 { 2610 bc_lex_next(&p->l); 2611 } 2612 } 2613 2614 return BC_PARSE_STATUS_SUCCESS; 2615 } 2616 2617 /** 2618 * Parses an expression with bc_parse_expr_err(), but throws an error if it gets 2619 * an empty expression. 2620 * @param p The parser. 2621 * @param flags The flags for what is valid in the expression. 2622 * @param next A set of tokens for what is valid *after* the expression. 2623 */ 2624 static void 2625 bc_parse_expr_status(BcParse* p, uint8_t flags, BcParseNext next) 2626 { 2627 BcParseStatus s = bc_parse_expr_err(p, flags, next); 2628 2629 if (BC_ERR(s == BC_PARSE_STATUS_EMPTY_EXPR)) 2630 { 2631 bc_parse_err(p, BC_ERR_PARSE_EMPTY_EXPR); 2632 } 2633 } 2634 2635 void 2636 bc_parse_expr(BcParse* p, uint8_t flags) 2637 { 2638 assert(p); 2639 bc_parse_expr_status(p, flags, bc_parse_next_read); 2640 } 2641 #endif // BC_ENABLED 2642