1 /* 2 * Copyright (C) 2010 Dan Carpenter. 3 * 4 * This program is free software; you can redistribute it and/or 5 * modify it under the terms of the GNU General Public License 6 * as published by the Free Software Foundation; either version 2 7 * of the License, or (at your option) any later version. 8 * 9 * This program is distributed in the hope that it will be useful, 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of 11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 12 * GNU General Public License for more details. 13 * 14 * You should have received a copy of the GNU General Public License 15 * along with this program; if not, see http://www.gnu.org/copyleft/gpl.txt 16 */ 17 18 #include <string.h> 19 #include <errno.h> 20 #include <unistd.h> 21 #include <ctype.h> 22 #include "smatch.h" 23 #include "smatch_slist.h" 24 #include "smatch_extra.h" 25 26 struct sqlite3 *smatch_db; 27 struct sqlite3 *mem_db; 28 struct sqlite3 *cache_db; 29 30 int debug_db; 31 32 static int return_id; 33 34 static void call_return_state_hooks(struct expression *expr); 35 36 #define SQLITE_CACHE_PAGES 1000 37 38 struct def_callback { 39 int hook_type; 40 void (*callback)(const char *name, struct symbol *sym, char *key, char *value); 41 }; 42 ALLOCATOR(def_callback, "definition db hook callbacks"); 43 DECLARE_PTR_LIST(callback_list, struct def_callback); 44 static struct callback_list *select_caller_info_callbacks; 45 46 struct member_info_callback { 47 int owner; 48 void (*callback)(struct expression *call, int param, char *printed_name, struct sm_state *sm); 49 }; 50 ALLOCATOR(member_info_callback, "caller_info callbacks"); 51 DECLARE_PTR_LIST(member_info_cb_list, struct member_info_callback); 52 static struct member_info_cb_list *member_callbacks; 53 54 struct returned_state_callback { 55 void (*callback)(int return_id, char *return_ranges, struct expression *return_expr); 56 }; 57 ALLOCATOR(returned_state_callback, "returned state callbacks"); 58 DECLARE_PTR_LIST(returned_state_cb_list, struct returned_state_callback); 59 static struct returned_state_cb_list *returned_state_callbacks; 60 61 struct returned_member_callback { 62 int owner; 63 void (*callback)(int return_id, char *return_ranges, struct expression *expr, char *printed_name, struct smatch_state *state); 64 }; 65 ALLOCATOR(returned_member_callback, "returned member callbacks"); 66 DECLARE_PTR_LIST(returned_member_cb_list, struct returned_member_callback); 67 static struct returned_member_cb_list *returned_member_callbacks; 68 69 struct db_implies_callback { 70 int type; 71 void (*callback)(struct expression *call, struct expression *arg, char *key, char *value); 72 }; 73 ALLOCATOR(db_implies_callback, "return_implies callbacks"); 74 DECLARE_PTR_LIST(db_implies_cb_list, struct db_implies_callback); 75 static struct db_implies_cb_list *return_implies_cb_list; 76 static struct db_implies_cb_list *call_implies_cb_list; 77 78 /* silently truncates if needed. */ 79 char *escape_newlines(const char *str) 80 { 81 char buf[1024] = ""; 82 bool found = false; 83 int i, j; 84 85 for (i = 0, j = 0; str[i] != '\0' && j != sizeof(buf); i++, j++) { 86 if (str[i] != '\r' && str[i] != '\n') { 87 buf[j] = str[i]; 88 continue; 89 } 90 91 found = true; 92 buf[j++] = '\\'; 93 if (j == sizeof(buf)) 94 break; 95 buf[j] = 'n'; 96 } 97 98 if (!found) 99 return alloc_sname(str); 100 101 if (j == sizeof(buf)) 102 buf[j - 1] = '\0'; 103 return alloc_sname(buf); 104 } 105 106 static int print_sql_output(void *unused, int argc, char **argv, char **azColName) 107 { 108 int i; 109 110 for (i = 0; i < argc; i++) { 111 if (i != 0) 112 sm_printf(", "); 113 sm_printf("%s", argv[i]); 114 } 115 sm_printf("\n"); 116 return 0; 117 } 118 119 void sql_exec(struct sqlite3 *db, int (*callback)(void*, int, char**, char**), void *data, const char *sql) 120 { 121 char *err = NULL; 122 int rc; 123 124 if (!db) 125 return; 126 127 if (option_debug || debug_db) { 128 sm_msg("%s", sql); 129 if (strncasecmp(sql, "select", strlen("select")) == 0) 130 sqlite3_exec(db, sql, print_sql_output, NULL, NULL); 131 } 132 133 rc = sqlite3_exec(db, sql, callback, data, &err); 134 if (rc != SQLITE_OK && !parse_error) { 135 sm_ierror("%s:%d SQL error #2: %s\n", get_filename(), get_lineno(), err); 136 sm_ierror("%s:%d SQL: '%s'\n", get_filename(), get_lineno(), sql); 137 parse_error = 1; 138 } 139 } 140 141 static int replace_count; 142 static char **replace_table; 143 static const char *replace_return_ranges(const char *return_ranges) 144 { 145 int i; 146 147 if (!get_function()) { 148 /* I have no idea why EXPORT_SYMBOL() is here */ 149 return return_ranges; 150 } 151 for (i = 0; i < replace_count; i += 3) { 152 if (strcmp(replace_table[i + 0], get_function()) == 0) { 153 if (strcmp(replace_table[i + 1], return_ranges) == 0) 154 return replace_table[i + 2]; 155 } 156 } 157 return return_ranges; 158 } 159 160 161 static char *use_states; 162 static int get_db_state_count(void) 163 { 164 struct sm_state *sm; 165 int count = 0; 166 167 FOR_EACH_SM(__get_cur_stree(), sm) { 168 if (sm->owner == USHRT_MAX) 169 continue; 170 if (use_states[sm->owner]) 171 count++; 172 } END_FOR_EACH_SM(sm); 173 return count; 174 } 175 176 void db_ignore_states(int id) 177 { 178 use_states[id] = 0; 179 } 180 181 void sql_insert_return_states(int return_id, const char *return_ranges, 182 int type, int param, const char *key, const char *value) 183 { 184 if (key && strlen(key) >= 80) 185 return; 186 return_ranges = replace_return_ranges(return_ranges); 187 sql_insert(return_states, "'%s', '%s', %lu, %d, '%s', %d, %d, %d, '%s', '%s'", 188 get_base_file(), get_function(), (unsigned long)__inline_fn, 189 return_id, return_ranges, fn_static(), type, param, key, value); 190 } 191 192 static struct string_list *common_funcs; 193 static int is_common_function(const char *fn) 194 { 195 char *tmp; 196 197 if (!fn) 198 return 0; 199 200 if (strncmp(fn, "__builtin_", 10) == 0) 201 return 1; 202 203 FOR_EACH_PTR(common_funcs, tmp) { 204 if (strcmp(tmp, fn) == 0) 205 return 1; 206 } END_FOR_EACH_PTR(tmp); 207 208 return 0; 209 } 210 211 static char *function_signature(void) 212 { 213 return type_to_str(get_real_base_type(cur_func_sym)); 214 } 215 216 void sql_insert_caller_info(struct expression *call, int type, 217 int param, const char *key, const char *value) 218 { 219 FILE *tmp_fd = sm_outfd; 220 char *fn; 221 222 if (!option_info && !__inline_call) 223 return; 224 225 if (key && strlen(key) >= 80) 226 return; 227 228 fn = get_fnptr_name(call->fn); 229 if (!fn) 230 return; 231 232 if (__inline_call) { 233 mem_sql(NULL, NULL, 234 "insert into caller_info values ('%s', '%s', '%s', %lu, %d, %d, %d, '%s', '%s');", 235 get_base_file(), get_function(), fn, (unsigned long)call, 236 is_static(call->fn), type, param, key, value); 237 } 238 239 if (!option_info) 240 return; 241 242 if (strncmp(fn, "__builtin_", 10) == 0) 243 return; 244 if (type != INTERNAL && is_common_function(fn)) 245 return; 246 247 sm_outfd = caller_info_fd; 248 sm_msg("SQL_caller_info: insert into caller_info values (" 249 "'%s', '%s', '%s', %%CALL_ID%%, %d, %d, %d, '%s', '%s');", 250 get_base_file(), get_function(), fn, is_static(call->fn), 251 type, param, key, value); 252 sm_outfd = tmp_fd; 253 254 free_string(fn); 255 } 256 257 void sql_insert_function_ptr(const char *fn, const char *struct_name) 258 { 259 sql_insert_or_ignore(function_ptr, "'%s', '%s', '%s', 0", 260 get_base_file(), fn, struct_name); 261 } 262 263 void sql_insert_return_implies(int type, int param, const char *key, const char *value) 264 { 265 sql_insert_or_ignore(return_implies, "'%s', '%s', %lu, %d, %d, %d, '%s', '%s'", 266 get_base_file(), get_function(), (unsigned long)__inline_fn, 267 fn_static(), type, param, key, value); 268 } 269 270 void sql_insert_call_implies(int type, int param, const char *key, const char *value) 271 { 272 sql_insert_or_ignore(call_implies, "'%s', '%s', %lu, %d, %d, %d, '%s', '%s'", 273 get_base_file(), get_function(), (unsigned long)__inline_fn, 274 fn_static(), type, param, key, value); 275 } 276 277 void sql_insert_function_type_size(const char *member, const char *ranges) 278 { 279 sql_insert(function_type_size, "'%s', '%s', '%s', '%s'", get_base_file(), get_function(), member, ranges); 280 } 281 282 void sql_insert_function_type_info(int type, const char *struct_type, const char *member, const char *value) 283 { 284 sql_insert(function_type_info, "'%s', '%s', %d, '%s', '%s', '%s'", get_base_file(), get_function(), type, struct_type, member, value); 285 } 286 287 void sql_insert_type_info(int type, const char *member, const char *value) 288 { 289 sql_insert_cache(type_info, "'%s', %d, '%s', '%s'", get_base_file(), type, member, value); 290 } 291 292 void sql_insert_local_values(const char *name, const char *value) 293 { 294 sql_insert(local_values, "'%s', '%s', '%s'", get_base_file(), name, value); 295 } 296 297 void sql_insert_function_type_value(const char *type, const char *value) 298 { 299 sql_insert(function_type_value, "'%s', '%s', '%s', '%s'", get_base_file(), get_function(), type, value); 300 } 301 302 void sql_insert_function_type(int param, const char *value) 303 { 304 sql_insert(function_type, "'%s', '%s', %d, %d, '%s'", 305 get_base_file(), get_function(), fn_static(), param, value); 306 } 307 308 void sql_insert_parameter_name(int param, const char *value) 309 { 310 sql_insert(parameter_name, "'%s', '%s', %d, %d, '%s'", 311 get_base_file(), get_function(), fn_static(), param, value); 312 } 313 314 void sql_insert_data_info(struct expression *data, int type, const char *value) 315 { 316 char *data_name; 317 318 data_name = get_data_info_name(data); 319 if (!data_name) 320 return; 321 sql_insert(data_info, "'%s', '%s', %d, '%s'", 322 is_static(data) ? get_base_file() : "extern", 323 data_name, type, value); 324 } 325 326 void sql_insert_data_info_var_sym(const char *var, struct symbol *sym, int type, const char *value) 327 { 328 sql_insert(data_info, "'%s', '%s', %d, '%s'", 329 (sym->ctype.modifiers & MOD_STATIC) ? get_base_file() : "extern", 330 var, type, value); 331 } 332 333 void sql_save_constraint(const char *con) 334 { 335 if (!option_info) 336 return; 337 338 sm_msg("SQL: insert or ignore into constraints (str) values('%s');", escape_newlines(con)); 339 } 340 341 void sql_save_constraint_required(const char *data, int op, const char *limit) 342 { 343 sql_insert_or_ignore(constraints_required, "'%s', '%s', '%s'", data, show_special(op), limit); 344 } 345 346 void sql_copy_constraint_required(const char *new_limit, const char *old_limit) 347 { 348 if (!option_info) 349 return; 350 351 sm_msg("SQL_late: insert or ignore into constraints_required (data, op, bound) " 352 "select constraints_required.data, constraints_required.op, '%s' from " 353 "constraints_required where bound = '%s';", new_limit, old_limit); 354 } 355 356 void sql_insert_fn_ptr_data_link(const char *ptr, const char *data) 357 { 358 sql_insert_or_ignore(fn_ptr_data_link, "'%s', '%s'", ptr, data); 359 } 360 361 void sql_insert_fn_data_link(struct expression *fn, int type, int param, const char *key, const char *value) 362 { 363 if (fn->type != EXPR_SYMBOL || !fn->symbol->ident) 364 return; 365 366 sql_insert(fn_data_link, "'%s', '%s', %d, %d, %d, '%s', '%s'", 367 (fn->symbol->ctype.modifiers & MOD_STATIC) ? get_base_file() : "extern", 368 fn->symbol->ident->name, 369 !!(fn->symbol->ctype.modifiers & MOD_STATIC), 370 type, param, key, value); 371 } 372 373 void sql_insert_mtag_about(mtag_t tag, const char *left_name, const char *right_name) 374 { 375 sql_insert(mtag_about, "%lld, '%s', '%s', %d, '%s', '%s'", 376 tag, get_filename(), get_function(), get_lineno(), left_name, right_name); 377 } 378 379 void sql_insert_mtag_map(mtag_t tag, int offset, mtag_t container) 380 { 381 sql_insert(mtag_map, "%lld, %d, %lld", tag, offset, container); 382 } 383 384 void sql_insert_mtag_alias(mtag_t orig, mtag_t alias) 385 { 386 sql_insert(mtag_alias, "%lld, %lld", orig, alias); 387 } 388 389 static int save_mtag(void *_tag, int argc, char **argv, char **azColName) 390 { 391 mtag_t *saved_tag = _tag; 392 mtag_t new_tag; 393 394 new_tag = strtoll(argv[0], NULL, 10); 395 396 if (!*saved_tag) 397 *saved_tag = new_tag; 398 else if (*saved_tag != new_tag) 399 *saved_tag = -1ULL; 400 401 return 0; 402 } 403 404 int mtag_map_select_container(mtag_t tag, int offset, mtag_t *container) 405 { 406 mtag_t tmp = 0; 407 408 run_sql(save_mtag, &tmp, 409 "select container from mtag_map where tag = %lld and offset = %d;", 410 tag, offset); 411 412 if (tmp == 0 || tmp == -1ULL) 413 return 0; 414 *container = tmp; 415 return 1; 416 } 417 418 int mtag_map_select_tag(mtag_t container, int offset, mtag_t *tag) 419 { 420 mtag_t tmp = 0; 421 422 run_sql(save_mtag, &tmp, 423 "select tag from mtag_map where container = %lld and offset = %d;", 424 container, offset); 425 426 if (tmp == 0 || tmp == -1ULL) 427 return 0; 428 *tag = tmp; 429 return 1; 430 } 431 432 char *get_static_filter(struct symbol *sym) 433 { 434 static char sql_filter[1024]; 435 436 /* This can only happen on buggy code. Return invalid SQL. */ 437 if (!sym) { 438 sql_filter[0] = '\0'; 439 return sql_filter; 440 } 441 442 if (sym->ctype.modifiers & MOD_STATIC) { 443 snprintf(sql_filter, sizeof(sql_filter), 444 "file = '%s' and function = '%s' and static = '1'", 445 get_base_file(), sym->ident->name); 446 } else { 447 snprintf(sql_filter, sizeof(sql_filter), 448 "function = '%s' and static = '0'", sym->ident->name); 449 } 450 451 return sql_filter; 452 } 453 454 static int get_row_count(void *_row_count, int argc, char **argv, char **azColName) 455 { 456 int *row_count = _row_count; 457 458 *row_count = 0; 459 if (argc != 1) 460 return 0; 461 *row_count = atoi(argv[0]); 462 return 0; 463 } 464 465 static void mark_call_params_untracked(struct expression *call) 466 { 467 struct expression *arg; 468 int i = 0; 469 470 FOR_EACH_PTR(call->args, arg) { 471 mark_untracked(call, i++, "$", NULL); 472 } END_FOR_EACH_PTR(arg); 473 } 474 475 static void sql_select_return_states_pointer(const char *cols, 476 struct expression *call, int (*callback)(void*, int, char**, char**), void *info) 477 { 478 char *ptr; 479 int return_count = 0; 480 481 ptr = get_fnptr_name(call->fn); 482 if (!ptr) 483 return; 484 485 run_sql(get_row_count, &return_count, 486 "select count(*) from return_states join function_ptr " 487 "where return_states.function == function_ptr.function and " 488 "ptr = '%s' and searchable = 1 and type = %d;", ptr, INTERNAL); 489 /* The magic number 100 is just from testing on the kernel. */ 490 if (return_count > 100) { 491 mark_call_params_untracked(call); 492 return; 493 } 494 495 run_sql(callback, info, 496 "select %s from return_states join function_ptr where " 497 "return_states.function == function_ptr.function and ptr = '%s' " 498 "and searchable = 1 " 499 "order by function_ptr.file, return_states.file, return_id, type;", 500 cols, ptr); 501 } 502 503 static int is_local_symbol(struct expression *expr) 504 { 505 if (expr->type != EXPR_SYMBOL) 506 return 0; 507 if (expr->symbol->ctype.modifiers & (MOD_NONLOCAL | MOD_STATIC | MOD_ADDRESSABLE)) 508 return 0; 509 return 1; 510 } 511 512 void sql_select_return_states(const char *cols, struct expression *call, 513 int (*callback)(void*, int, char**, char**), void *info) 514 { 515 struct expression *fn; 516 int row_count = 0; 517 518 if (is_fake_call(call)) 519 return; 520 521 fn = strip_expr(call->fn); 522 if (fn->type != EXPR_SYMBOL || !fn->symbol || is_local_symbol(fn)) { 523 sql_select_return_states_pointer(cols, call, callback, info); 524 return; 525 } 526 527 if (inlinable(fn)) { 528 mem_sql(callback, info, 529 "select %s from return_states where call_id = '%lu' order by return_id, type;", 530 cols, (unsigned long)call); 531 return; 532 } 533 534 run_sql(get_row_count, &row_count, "select count(*) from return_states where %s;", 535 get_static_filter(fn->symbol)); 536 if (row_count > 3000) 537 return; 538 539 run_sql(callback, info, "select %s from return_states where %s order by file, return_id, type;", 540 cols, get_static_filter(fn->symbol)); 541 } 542 543 #define CALL_IMPLIES 0 544 #define RETURN_IMPLIES 1 545 546 struct implies_info { 547 int type; 548 struct db_implies_cb_list *cb_list; 549 struct expression *expr; 550 struct symbol *sym; 551 }; 552 553 void sql_select_implies(const char *cols, struct implies_info *info, 554 int (*callback)(void*, int, char**, char**)) 555 { 556 if (info->type == RETURN_IMPLIES && inlinable(info->expr->fn)) { 557 mem_sql(callback, info, 558 "select %s from return_implies where call_id = '%lu';", 559 cols, (unsigned long)info->expr); 560 return; 561 } 562 563 run_sql(callback, info, "select %s from %s_implies where %s;", 564 cols, 565 info->type == CALL_IMPLIES ? "call" : "return", 566 get_static_filter(info->sym)); 567 } 568 569 struct select_caller_info_data { 570 struct stree *final_states; 571 struct timeval start_time; 572 int prev_func_id; 573 int ignore; 574 int results; 575 }; 576 577 static int caller_info_callback(void *_data, int argc, char **argv, char **azColName); 578 579 static void sql_select_caller_info(struct select_caller_info_data *data, 580 const char *cols, struct symbol *sym) 581 { 582 if (__inline_fn) { 583 mem_sql(caller_info_callback, data, 584 "select %s from caller_info where call_id = %lu;", 585 cols, (unsigned long)__inline_fn); 586 return; 587 } 588 589 if (sym->ident->name && is_common_function(sym->ident->name)) 590 return; 591 run_sql(caller_info_callback, data, 592 "select %s from common_caller_info where %s order by call_id;", 593 cols, get_static_filter(sym)); 594 if (data->results) 595 return; 596 597 run_sql(caller_info_callback, data, 598 "select %s from caller_info where %s order by call_id;", 599 cols, get_static_filter(sym)); 600 } 601 602 void select_caller_info_hook(void (*callback)(const char *name, struct symbol *sym, char *key, char *value), int type) 603 { 604 struct def_callback *def_callback = __alloc_def_callback(0); 605 606 def_callback->hook_type = type; 607 def_callback->callback = callback; 608 add_ptr_list(&select_caller_info_callbacks, def_callback); 609 } 610 611 /* 612 * These call backs are used when the --info option is turned on to print struct 613 * member information. For example foo->bar could have a state in 614 * smatch_extra.c and also check_user.c. 615 */ 616 void add_member_info_callback(int owner, void (*callback)(struct expression *call, int param, char *printed_name, struct sm_state *sm)) 617 { 618 struct member_info_callback *member_callback = __alloc_member_info_callback(0); 619 620 member_callback->owner = owner; 621 member_callback->callback = callback; 622 add_ptr_list(&member_callbacks, member_callback); 623 } 624 625 void add_split_return_callback(void (*fn)(int return_id, char *return_ranges, struct expression *returned_expr)) 626 { 627 struct returned_state_callback *callback = __alloc_returned_state_callback(0); 628 629 callback->callback = fn; 630 add_ptr_list(&returned_state_callbacks, callback); 631 } 632 633 void add_returned_member_callback(int owner, void (*callback)(int return_id, char *return_ranges, struct expression *expr, char *printed_name, struct smatch_state *state)) 634 { 635 struct returned_member_callback *member_callback = __alloc_returned_member_callback(0); 636 637 member_callback->owner = owner; 638 member_callback->callback = callback; 639 add_ptr_list(&returned_member_callbacks, member_callback); 640 } 641 642 void select_call_implies_hook(int type, void (*callback)(struct expression *call, struct expression *arg, char *key, char *value)) 643 { 644 struct db_implies_callback *cb = __alloc_db_implies_callback(0); 645 646 cb->type = type; 647 cb->callback = callback; 648 add_ptr_list(&call_implies_cb_list, cb); 649 } 650 651 void select_return_implies_hook(int type, void (*callback)(struct expression *call, struct expression *arg, char *key, char *value)) 652 { 653 struct db_implies_callback *cb = __alloc_db_implies_callback(0); 654 655 cb->type = type; 656 cb->callback = callback; 657 add_ptr_list(&return_implies_cb_list, cb); 658 } 659 660 struct return_info { 661 struct expression *static_returns_call; 662 struct symbol *return_type; 663 struct range_list *return_range_list; 664 }; 665 666 static int db_return_callback(void *_ret_info, int argc, char **argv, char **azColName) 667 { 668 struct return_info *ret_info = _ret_info; 669 struct range_list *rl; 670 struct expression *call_expr = ret_info->static_returns_call; 671 672 if (argc != 1) 673 return 0; 674 call_results_to_rl(call_expr, ret_info->return_type, argv[0], &rl); 675 ret_info->return_range_list = rl_union(ret_info->return_range_list, rl); 676 return 0; 677 } 678 679 struct range_list *db_return_vals(struct expression *expr) 680 { 681 struct return_info ret_info = {}; 682 char buf[64]; 683 struct sm_state *sm; 684 685 if (is_fake_call(expr)) 686 return NULL; 687 688 snprintf(buf, sizeof(buf), "return %p", expr); 689 sm = get_sm_state(SMATCH_EXTRA, buf, NULL); 690 if (sm) 691 return clone_rl(estate_rl(sm->state)); 692 ret_info.static_returns_call = expr; 693 ret_info.return_type = get_type(expr); 694 if (!ret_info.return_type) 695 return NULL; 696 697 if (expr->fn->type != EXPR_SYMBOL || !expr->fn->symbol) 698 return NULL; 699 700 ret_info.return_range_list = NULL; 701 if (inlinable(expr->fn)) { 702 mem_sql(db_return_callback, &ret_info, 703 "select distinct return from return_states where call_id = '%lu';", 704 (unsigned long)expr); 705 } else { 706 run_sql(db_return_callback, &ret_info, 707 "select distinct return from return_states where %s;", 708 get_static_filter(expr->fn->symbol)); 709 } 710 return ret_info.return_range_list; 711 } 712 713 struct range_list *db_return_vals_from_str(const char *fn_name) 714 { 715 struct return_info ret_info; 716 717 ret_info.static_returns_call = NULL; 718 ret_info.return_type = &llong_ctype; 719 ret_info.return_range_list = NULL; 720 721 run_sql(db_return_callback, &ret_info, 722 "select distinct return from return_states where function = '%s';", 723 fn_name); 724 return ret_info.return_range_list; 725 } 726 727 /* 728 * This is used when we have a function that takes a function pointer as a 729 * parameter. "frob(blah, blah, my_function);" We know that the return values 730 * from frob() come from my_funcion() so we want to find the possible returns 731 * of my_function(), but we don't know which arguments are passed to it. 732 * 733 */ 734 struct range_list *db_return_vals_no_args(struct expression *expr) 735 { 736 struct return_info ret_info = {}; 737 738 if (!expr || expr->type != EXPR_SYMBOL) 739 return NULL; 740 741 ret_info.static_returns_call = expr; 742 ret_info.return_type = get_type(expr); 743 ret_info.return_type = get_real_base_type(ret_info.return_type); 744 if (!ret_info.return_type) 745 return NULL; 746 747 run_sql(db_return_callback, &ret_info, 748 "select distinct return from return_states where %s;", 749 get_static_filter(expr->symbol)); 750 751 return ret_info.return_range_list; 752 } 753 754 static void match_call_marker(struct expression *expr) 755 { 756 struct symbol *type; 757 758 type = get_type(expr->fn); 759 if (type && type->type == SYM_PTR) 760 type = get_real_base_type(type); 761 762 /* 763 * we just want to record something in the database so that if we have 764 * two calls like: frob(4); frob(some_unkown); then on the receiving 765 * side we know that sometimes frob is called with unknown parameters. 766 */ 767 768 sql_insert_caller_info(expr, INTERNAL, -1, "%call_marker%", type_to_str(type)); 769 } 770 771 int is_recursive_member(const char *name) 772 { 773 char buf[256]; 774 const char *p, *next; 775 int size; 776 777 p = strchr(name, '>'); 778 if (!p) 779 return 0; 780 p++; 781 while (true) { 782 next = strchr(p, '>'); 783 if (!next) 784 return 0; 785 next++; 786 787 size = next - p; 788 if (size >= sizeof(buf)) 789 return 0; 790 memcpy(buf, p, size); 791 buf[size] = '\0'; 792 if (strstr(next, buf)) 793 return 1; 794 p = next; 795 } 796 } 797 798 char *sm_to_arg_name(struct expression *expr, struct sm_state *sm) 799 { 800 struct symbol *sym; 801 const char *sm_name; 802 char *name; 803 bool is_address = false; 804 bool add_star = false; 805 char buf[256]; 806 char *ret = NULL; 807 int len; 808 809 expr = strip_expr(expr); 810 if (!expr) 811 return NULL; 812 813 if (expr->type == EXPR_PREOP && expr->op == '&') { 814 expr = strip_expr(expr->unop); 815 is_address = true; 816 } 817 818 name = expr_to_var_sym(expr, &sym); 819 if (!name || !sym) 820 goto free; 821 if (sym != sm->sym) 822 goto free; 823 824 sm_name = sm->name; 825 add_star = false; 826 if (sm_name[0] == '*') { 827 add_star = true; 828 sm_name++; 829 } 830 831 len = strlen(name); 832 if (strncmp(name, sm_name, len) != 0) 833 goto free; 834 if (sm_name[len] == '\0') { 835 snprintf(buf, sizeof(buf), "%s%s$", 836 add_star ? "*" : "", is_address ? "*" : ""); 837 } else { 838 if (sm_name[len] != '.' && sm_name[len] != '-') 839 goto free; 840 if (sm_name[len] == '-') 841 len++; 842 // FIXME does is_address really imply that sm_name[len] == '-' 843 snprintf(buf, sizeof(buf), "%s$->%s", add_star ? "*" : "", 844 sm_name + len); 845 } 846 847 ret = alloc_sname(buf); 848 free: 849 free_string(name); 850 return ret; 851 } 852 853 static void print_struct_members(struct expression *call, struct expression *expr, int param, struct stree *stree, 854 void (*callback)(struct expression *call, int param, char *printed_name, struct sm_state *sm)) 855 { 856 struct sm_state *sm; 857 const char *sm_name; 858 char *name; 859 struct symbol *sym; 860 int len; 861 char printed_name[256]; 862 int is_address = 0; 863 bool add_star; 864 struct symbol *type; 865 866 expr = strip_expr(expr); 867 if (!expr) 868 return; 869 type = get_type(expr); 870 if (type && type_bits(type) < type_bits(&ulong_ctype)) 871 return; 872 873 if (expr->type == EXPR_PREOP && expr->op == '&') { 874 expr = strip_expr(expr->unop); 875 is_address = 1; 876 } 877 878 name = expr_to_var_sym(expr, &sym); 879 if (!name || !sym) 880 goto free; 881 882 len = strlen(name); 883 FOR_EACH_SM(stree, sm) { 884 if (sm->sym != sym) 885 continue; 886 sm_name = sm->name; 887 add_star = false; 888 if (sm_name[0] == '*') { 889 add_star = true; 890 sm_name++; 891 } 892 // FIXME: simplify? 893 if (!add_star && strcmp(name, sm_name) == 0) { 894 if (is_address) 895 snprintf(printed_name, sizeof(printed_name), "*$"); 896 else /* these are already handled. fixme: handle them here */ 897 continue; 898 } else if (add_star && strcmp(name, sm_name) == 0) { 899 snprintf(printed_name, sizeof(printed_name), "%s*$", 900 is_address ? "*" : ""); 901 } else if (strncmp(name, sm_name, len) == 0) { 902 if (sm_name[len] != '.' && sm_name[len] != '-') 903 continue; 904 if (is_address) 905 snprintf(printed_name, sizeof(printed_name), 906 "%s$->%s", add_star ? "*" : "", 907 sm_name + len + 1); 908 else 909 snprintf(printed_name, sizeof(printed_name), 910 "%s$%s", add_star ? "*" : "", 911 sm_name + len); 912 } else { 913 continue; 914 } 915 if (is_recursive_member(printed_name)) 916 continue; 917 callback(call, param, printed_name, sm); 918 } END_FOR_EACH_SM(sm); 919 free: 920 free_string(name); 921 } 922 923 static void match_call_info(struct expression *call) 924 { 925 struct member_info_callback *cb; 926 struct expression *arg; 927 struct stree *stree; 928 char *name; 929 int i; 930 931 name = get_fnptr_name(call->fn); 932 if (!name) 933 return; 934 935 FOR_EACH_PTR(member_callbacks, cb) { 936 stree = get_all_states_stree(cb->owner); 937 i = 0; 938 FOR_EACH_PTR(call->args, arg) { 939 print_struct_members(call, arg, i, stree, cb->callback); 940 i++; 941 } END_FOR_EACH_PTR(arg); 942 free_stree(&stree); 943 } END_FOR_EACH_PTR(cb); 944 945 free_string(name); 946 } 947 948 static int get_param(int param, char **name, struct symbol **sym) 949 { 950 struct symbol *arg; 951 int i; 952 953 i = 0; 954 FOR_EACH_PTR(cur_func_sym->ctype.base_type->arguments, arg) { 955 /* 956 * this is a temporary hack to work around a bug (I think in sparse?) 957 * 2.6.37-rc1:fs/reiserfs/journal.o 958 * If there is a function definition without parameter name found 959 * after a function implementation then it causes a crash. 960 * int foo() {} 961 * int bar(char *); 962 */ 963 if (arg->ident->name < (char *)100) 964 continue; 965 if (i == param) { 966 *name = arg->ident->name; 967 *sym = arg; 968 return TRUE; 969 } 970 i++; 971 } END_FOR_EACH_PTR(arg); 972 973 return FALSE; 974 } 975 976 static int function_signature_matches(const char *sig) 977 { 978 char *my_sig; 979 980 my_sig = function_signature(); 981 if (!sig || !my_sig) 982 return 1; /* default to matching */ 983 if (strcmp(my_sig, sig) == 0) 984 return 1; 985 return 0; 986 } 987 988 static int caller_info_callback(void *_data, int argc, char **argv, char **azColName) 989 { 990 struct select_caller_info_data *data = _data; 991 int func_id; 992 long type; 993 long param; 994 char *key; 995 char *value; 996 char *name = NULL; 997 struct symbol *sym = NULL; 998 struct def_callback *def_callback; 999 struct stree *stree; 1000 struct timeval cur_time; 1001 1002 data->results = 1; 1003 1004 if (argc != 5) 1005 return 0; 1006 1007 gettimeofday(&cur_time, NULL); 1008 if (cur_time.tv_sec - data->start_time.tv_sec > 10) 1009 return 0; 1010 1011 func_id = atoi(argv[0]); 1012 errno = 0; 1013 type = strtol(argv[1], NULL, 10); 1014 param = strtol(argv[2], NULL, 10); 1015 if (errno) 1016 return 0; 1017 key = argv[3]; 1018 value = argv[4]; 1019 1020 if (data->prev_func_id == -1) 1021 data->prev_func_id = func_id; 1022 if (func_id != data->prev_func_id) { 1023 stree = __pop_fake_cur_stree(); 1024 if (!data->ignore) 1025 merge_stree(&data->final_states, stree); 1026 free_stree(&stree); 1027 __push_fake_cur_stree(); 1028 __unnullify_path(); 1029 data->prev_func_id = func_id; 1030 data->ignore = 0; 1031 } 1032 1033 if (data->ignore) 1034 return 0; 1035 if (type == INTERNAL && 1036 !function_signature_matches(value)) { 1037 data->ignore = 1; 1038 return 0; 1039 } 1040 1041 if (param >= 0 && !get_param(param, &name, &sym)) 1042 return 0; 1043 1044 FOR_EACH_PTR(select_caller_info_callbacks, def_callback) { 1045 if (def_callback->hook_type == type) 1046 def_callback->callback(name, sym, key, value); 1047 } END_FOR_EACH_PTR(def_callback); 1048 1049 return 0; 1050 } 1051 1052 static struct string_list *ptr_names_done; 1053 static struct string_list *ptr_names; 1054 1055 static int get_ptr_name(void *unused, int argc, char **argv, char **azColName) 1056 { 1057 insert_string(&ptr_names, alloc_string(argv[0])); 1058 return 0; 1059 } 1060 1061 static char *get_next_ptr_name(void) 1062 { 1063 char *ptr; 1064 1065 FOR_EACH_PTR(ptr_names, ptr) { 1066 if (!insert_string(&ptr_names_done, ptr)) 1067 continue; 1068 return ptr; 1069 } END_FOR_EACH_PTR(ptr); 1070 return NULL; 1071 } 1072 1073 static void get_ptr_names(const char *file, const char *name) 1074 { 1075 char sql_filter[1024]; 1076 int before, after; 1077 1078 if (file) { 1079 snprintf(sql_filter, 1024, "file = '%s' and function = '%s';", 1080 file, name); 1081 } else { 1082 snprintf(sql_filter, 1024, "function = '%s';", name); 1083 } 1084 1085 before = ptr_list_size((struct ptr_list *)ptr_names); 1086 1087 run_sql(get_ptr_name, NULL, 1088 "select distinct ptr from function_ptr where %s", 1089 sql_filter); 1090 1091 after = ptr_list_size((struct ptr_list *)ptr_names); 1092 if (before == after) 1093 return; 1094 1095 while ((name = get_next_ptr_name())) 1096 get_ptr_names(NULL, name); 1097 } 1098 1099 static void match_data_from_db(struct symbol *sym) 1100 { 1101 struct select_caller_info_data data = { .prev_func_id = -1 }; 1102 struct sm_state *sm; 1103 struct stree *stree; 1104 struct timeval end_time; 1105 1106 if (!sym || !sym->ident) 1107 return; 1108 1109 gettimeofday(&data.start_time, NULL); 1110 1111 __push_fake_cur_stree(); 1112 __unnullify_path(); 1113 1114 if (!__inline_fn) { 1115 char *ptr; 1116 1117 if (sym->ctype.modifiers & MOD_STATIC) 1118 get_ptr_names(get_base_file(), sym->ident->name); 1119 else 1120 get_ptr_names(NULL, sym->ident->name); 1121 1122 if (ptr_list_size((struct ptr_list *)ptr_names) > 20) { 1123 __free_ptr_list((struct ptr_list **)&ptr_names); 1124 __free_ptr_list((struct ptr_list **)&ptr_names_done); 1125 __free_fake_cur_stree(); 1126 return; 1127 } 1128 1129 sql_select_caller_info(&data, 1130 "call_id, type, parameter, key, value", 1131 sym); 1132 1133 1134 stree = __pop_fake_cur_stree(); 1135 if (!data.ignore) 1136 merge_stree(&data.final_states, stree); 1137 free_stree(&stree); 1138 __push_fake_cur_stree(); 1139 __unnullify_path(); 1140 data.prev_func_id = -1; 1141 data.ignore = 0; 1142 data.results = 0; 1143 1144 FOR_EACH_PTR(ptr_names, ptr) { 1145 run_sql(caller_info_callback, &data, 1146 "select call_id, type, parameter, key, value" 1147 " from common_caller_info where function = '%s' order by call_id", 1148 ptr); 1149 } END_FOR_EACH_PTR(ptr); 1150 1151 if (data.results) { 1152 FOR_EACH_PTR(ptr_names, ptr) { 1153 free_string(ptr); 1154 } END_FOR_EACH_PTR(ptr); 1155 goto free_ptr_names; 1156 } 1157 1158 FOR_EACH_PTR(ptr_names, ptr) { 1159 run_sql(caller_info_callback, &data, 1160 "select call_id, type, parameter, key, value" 1161 " from caller_info where function = '%s' order by call_id", 1162 ptr); 1163 free_string(ptr); 1164 } END_FOR_EACH_PTR(ptr); 1165 1166 free_ptr_names: 1167 __free_ptr_list((struct ptr_list **)&ptr_names); 1168 __free_ptr_list((struct ptr_list **)&ptr_names_done); 1169 } else { 1170 sql_select_caller_info(&data, 1171 "call_id, type, parameter, key, value", 1172 sym); 1173 } 1174 1175 stree = __pop_fake_cur_stree(); 1176 if (!data.ignore) 1177 merge_stree(&data.final_states, stree); 1178 free_stree(&stree); 1179 1180 gettimeofday(&end_time, NULL); 1181 if (end_time.tv_sec - data.start_time.tv_sec <= 10) { 1182 FOR_EACH_SM(data.final_states, sm) { 1183 __set_sm(sm); 1184 } END_FOR_EACH_SM(sm); 1185 } 1186 1187 free_stree(&data.final_states); 1188 } 1189 1190 static int return_implies_callbacks(void *_info, int argc, char **argv, char **azColName) 1191 { 1192 struct implies_info *info = _info; 1193 struct db_implies_callback *cb; 1194 struct expression *arg = NULL; 1195 int type; 1196 int param; 1197 1198 if (argc != 5) 1199 return 0; 1200 1201 type = atoi(argv[1]); 1202 param = atoi(argv[2]); 1203 1204 FOR_EACH_PTR(info->cb_list, cb) { 1205 if (cb->type != type) 1206 continue; 1207 if (param != -1) { 1208 arg = get_argument_from_call_expr(info->expr->args, param); 1209 if (!arg) 1210 continue; 1211 } 1212 cb->callback(info->expr, arg, argv[3], argv[4]); 1213 } END_FOR_EACH_PTR(cb); 1214 1215 return 0; 1216 } 1217 1218 static int call_implies_callbacks(void *_info, int argc, char **argv, char **azColName) 1219 { 1220 struct implies_info *info = _info; 1221 struct db_implies_callback *cb; 1222 struct expression *arg; 1223 struct symbol *sym; 1224 char *name; 1225 int type; 1226 int param; 1227 1228 if (argc != 5) 1229 return 0; 1230 1231 type = atoi(argv[1]); 1232 param = atoi(argv[2]); 1233 1234 if (!get_param(param, &name, &sym)) 1235 return 0; 1236 arg = symbol_expression(sym); 1237 if (!arg) 1238 return 0; 1239 1240 FOR_EACH_PTR(info->cb_list, cb) { 1241 if (cb->type != type) 1242 continue; 1243 cb->callback(info->expr, arg, argv[3], argv[4]); 1244 } END_FOR_EACH_PTR(cb); 1245 1246 return 0; 1247 } 1248 1249 static void match_return_implies(struct expression *expr) 1250 { 1251 struct implies_info info = { 1252 .type = RETURN_IMPLIES, 1253 .cb_list = return_implies_cb_list, 1254 }; 1255 1256 if (expr->fn->type != EXPR_SYMBOL || 1257 !expr->fn->symbol) 1258 return; 1259 info.expr = expr; 1260 info.sym = expr->fn->symbol; 1261 sql_select_implies("function, type, parameter, key, value", &info, 1262 return_implies_callbacks); 1263 } 1264 1265 static void match_call_implies(struct symbol *sym) 1266 { 1267 struct implies_info info = { 1268 .type = CALL_IMPLIES, 1269 .cb_list = call_implies_cb_list, 1270 }; 1271 1272 if (!sym || !sym->ident) 1273 return; 1274 1275 info.sym = sym; 1276 sql_select_implies("function, type, parameter, key, value", &info, 1277 call_implies_callbacks); 1278 } 1279 1280 static char *get_fn_param_str(struct expression *expr) 1281 { 1282 struct expression *tmp; 1283 int param; 1284 char buf[32]; 1285 1286 tmp = get_assigned_expr(expr); 1287 if (tmp) 1288 expr = tmp; 1289 expr = strip_expr(expr); 1290 if (!expr || expr->type != EXPR_CALL) 1291 return NULL; 1292 expr = strip_expr(expr->fn); 1293 if (!expr || expr->type != EXPR_SYMBOL) 1294 return NULL; 1295 param = get_param_num(expr); 1296 if (param < 0) 1297 return NULL; 1298 1299 snprintf(buf, sizeof(buf), "[r $%d]", param); 1300 return alloc_sname(buf); 1301 } 1302 1303 static char *get_return_compare_is_param(struct expression *expr) 1304 { 1305 char *var; 1306 char buf[256]; 1307 int comparison; 1308 int param; 1309 1310 param = get_param_num(expr); 1311 if (param < 0) 1312 return NULL; 1313 1314 var = expr_to_var(expr); 1315 if (!var) 1316 return NULL; 1317 snprintf(buf, sizeof(buf), "%s orig", var); 1318 comparison = get_comparison_strings(var, buf); 1319 free_string(var); 1320 1321 if (!comparison) 1322 return NULL; 1323 1324 snprintf(buf, sizeof(buf), "[%s$%d]", show_special(comparison), param); 1325 return alloc_sname(buf); 1326 } 1327 1328 static char *get_return_compare_str(struct expression *expr) 1329 { 1330 char *compare_str; 1331 1332 compare_str = get_return_compare_is_param(expr); 1333 if (compare_str) 1334 return compare_str; 1335 1336 compare_str = expr_lte_to_param(expr, -1); 1337 if (compare_str) 1338 return compare_str; 1339 1340 return expr_param_comparison(expr, -1); 1341 } 1342 1343 static const char *get_return_ranges_str(struct expression *expr, struct range_list **rl_p) 1344 { 1345 struct range_list *rl; 1346 char *return_ranges; 1347 sval_t sval; 1348 char *fn_param_str; 1349 char *compare_str; 1350 char *math_str; 1351 char buf[128]; 1352 1353 *rl_p = NULL; 1354 1355 if (!expr) 1356 return alloc_sname(""); 1357 1358 if (get_implied_value(expr, &sval)) { 1359 sval = sval_cast(cur_func_return_type(), sval); 1360 *rl_p = alloc_rl(sval, sval); 1361 return sval_to_str_or_err_ptr(sval); 1362 } 1363 1364 fn_param_str = get_fn_param_str(expr); 1365 compare_str = expr_equal_to_param(expr, -1); 1366 math_str = get_value_in_terms_of_parameter_math(expr); 1367 1368 if (get_implied_rl(expr, &rl) && !is_whole_rl(rl)) { 1369 rl = cast_rl(cur_func_return_type(), rl); 1370 return_ranges = show_rl(rl); 1371 } else if (get_imaginary_absolute(expr, &rl)){ 1372 rl = cast_rl(cur_func_return_type(), rl); 1373 return alloc_sname(show_rl(rl)); 1374 } else { 1375 get_absolute_rl(expr, &rl); 1376 rl = cast_rl(cur_func_return_type(), rl); 1377 return_ranges = show_rl(rl); 1378 } 1379 *rl_p = rl; 1380 1381 if (fn_param_str) { 1382 snprintf(buf, sizeof(buf), "%s%s", return_ranges, fn_param_str); 1383 return alloc_sname(buf); 1384 } 1385 if (compare_str) { 1386 snprintf(buf, sizeof(buf), "%s%s", return_ranges, compare_str); 1387 return alloc_sname(buf); 1388 } 1389 if (math_str) { 1390 snprintf(buf, sizeof(buf), "%s[%s]", return_ranges, math_str); 1391 return alloc_sname(buf); 1392 } 1393 compare_str = get_return_compare_str(expr); 1394 if (compare_str) { 1395 snprintf(buf, sizeof(buf), "%s%s", return_ranges, compare_str); 1396 return alloc_sname(buf); 1397 } 1398 1399 return return_ranges; 1400 } 1401 1402 static void match_return_info(int return_id, char *return_ranges, struct expression *expr) 1403 { 1404 sql_insert_return_states(return_id, return_ranges, INTERNAL, -1, "", function_signature()); 1405 } 1406 1407 static bool call_return_state_hooks_conditional(struct expression *expr) 1408 { 1409 int final_pass_orig = final_pass; 1410 static int recurse; 1411 1412 if (recurse >= 2) 1413 return false; 1414 if (!expr || 1415 (expr->type != EXPR_CONDITIONAL && expr->type != EXPR_SELECT)) 1416 return false; 1417 1418 recurse++; 1419 1420 __push_fake_cur_stree(); 1421 1422 final_pass = 0; 1423 __split_whole_condition(expr->conditional); 1424 final_pass = final_pass_orig; 1425 1426 call_return_state_hooks(expr->cond_true ?: expr->conditional); 1427 1428 __push_true_states(); 1429 __use_false_states(); 1430 1431 call_return_state_hooks(expr->cond_false); 1432 1433 __merge_true_states(); 1434 __free_fake_cur_stree(); 1435 1436 recurse--; 1437 return true; 1438 } 1439 1440 static void call_return_state_hooks_compare(struct expression *expr) 1441 { 1442 struct returned_state_callback *cb; 1443 char *return_ranges; 1444 int final_pass_orig = final_pass; 1445 sval_t sval = { .type = &int_ctype }; 1446 sval_t ret; 1447 1448 if (!get_implied_value(expr, &ret)) 1449 ret.value = -1; 1450 1451 __push_fake_cur_stree(); 1452 1453 final_pass = 0; 1454 __split_whole_condition(expr); 1455 final_pass = final_pass_orig; 1456 1457 if (ret.value != 0) { 1458 return_ranges = alloc_sname("1"); 1459 sval.value = 1; 1460 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_sval(sval)); 1461 1462 return_id++; 1463 FOR_EACH_PTR(returned_state_callbacks, cb) { 1464 cb->callback(return_id, return_ranges, expr); 1465 } END_FOR_EACH_PTR(cb); 1466 } 1467 1468 __push_true_states(); 1469 __use_false_states(); 1470 1471 if (ret.value != 1) { 1472 return_ranges = alloc_sname("0"); 1473 sval.value = 0; 1474 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_sval(sval)); 1475 1476 return_id++; 1477 FOR_EACH_PTR(returned_state_callbacks, cb) { 1478 cb->callback(return_id, return_ranges, expr); 1479 } END_FOR_EACH_PTR(cb); 1480 } 1481 1482 __merge_true_states(); 1483 __free_fake_cur_stree(); 1484 } 1485 1486 static int ptr_in_list(struct sm_state *sm, struct state_list *slist) 1487 { 1488 struct sm_state *tmp; 1489 1490 FOR_EACH_PTR(slist, tmp) { 1491 if (strcmp(tmp->state->name, sm->state->name) == 0) 1492 return 1; 1493 } END_FOR_EACH_PTR(tmp); 1494 1495 return 0; 1496 } 1497 1498 static int split_possible_helper(struct sm_state *sm, struct expression *expr) 1499 { 1500 struct returned_state_callback *cb; 1501 struct range_list *rl; 1502 char *return_ranges; 1503 struct sm_state *tmp; 1504 int ret = 0; 1505 int nr_possible, nr_states; 1506 char *compare_str; 1507 char buf[128]; 1508 struct state_list *already_handled = NULL; 1509 sval_t sval; 1510 1511 if (!sm || !sm->merged) 1512 return 0; 1513 1514 if (too_many_possible(sm)) 1515 return 0; 1516 1517 /* bail if it gets too complicated */ 1518 nr_possible = 0; 1519 FOR_EACH_PTR(sm->possible, tmp) { 1520 if (tmp->merged) 1521 continue; 1522 if (ptr_in_list(tmp, already_handled)) 1523 continue; 1524 add_ptr_list(&already_handled, tmp); 1525 nr_possible++; 1526 } END_FOR_EACH_PTR(tmp); 1527 free_slist(&already_handled); 1528 nr_states = get_db_state_count(); 1529 if (nr_states * nr_possible >= 2000) 1530 return 0; 1531 1532 FOR_EACH_PTR(sm->possible, tmp) { 1533 if (tmp->merged) 1534 continue; 1535 if (ptr_in_list(tmp, already_handled)) 1536 continue; 1537 add_ptr_list(&already_handled, tmp); 1538 1539 ret = 1; 1540 __push_fake_cur_stree(); 1541 1542 overwrite_states_using_pool(sm, tmp); 1543 1544 rl = cast_rl(cur_func_return_type(), estate_rl(tmp->state)); 1545 return_ranges = show_rl(rl); 1546 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(clone_rl(rl))); 1547 if (!rl_to_sval(rl, &sval)) { 1548 compare_str = get_return_compare_str(expr); 1549 if (compare_str) { 1550 snprintf(buf, sizeof(buf), "%s%s", return_ranges, compare_str); 1551 return_ranges = alloc_sname(buf); 1552 } 1553 } 1554 1555 return_id++; 1556 FOR_EACH_PTR(returned_state_callbacks, cb) { 1557 cb->callback(return_id, return_ranges, expr); 1558 } END_FOR_EACH_PTR(cb); 1559 1560 __free_fake_cur_stree(); 1561 } END_FOR_EACH_PTR(tmp); 1562 1563 free_slist(&already_handled); 1564 1565 return ret; 1566 } 1567 1568 static int call_return_state_hooks_split_possible(struct expression *expr) 1569 { 1570 struct sm_state *sm; 1571 1572 if (!expr || expr_equal_to_param(expr, -1)) 1573 return 0; 1574 1575 sm = get_sm_state_expr(SMATCH_EXTRA, expr); 1576 return split_possible_helper(sm, expr); 1577 } 1578 1579 static bool has_possible_negative(struct sm_state *sm) 1580 { 1581 struct sm_state *tmp; 1582 1583 if (!type_signed(estate_type(sm->state))) 1584 return false; 1585 1586 FOR_EACH_PTR(sm->possible, tmp) { 1587 if (!estate_rl(tmp->state)) 1588 continue; 1589 if (sval_is_negative(estate_min(tmp->state)) && 1590 sval_is_negative(estate_max(tmp->state))) 1591 return true; 1592 } END_FOR_EACH_PTR(tmp); 1593 1594 return false; 1595 } 1596 1597 static bool has_separate_zero_null(struct sm_state *sm) 1598 { 1599 struct sm_state *tmp; 1600 sval_t sval; 1601 1602 FOR_EACH_PTR(sm->possible, tmp) { 1603 if (!estate_get_single_value(tmp->state, &sval)) 1604 continue; 1605 if (sval.value == 0) 1606 return true; 1607 } END_FOR_EACH_PTR(tmp); 1608 1609 return false; 1610 } 1611 1612 static int split_positive_from_negative(struct expression *expr) 1613 { 1614 struct sm_state *sm; 1615 struct returned_state_callback *cb; 1616 struct range_list *rl; 1617 const char *return_ranges; 1618 struct range_list *ret_rl; 1619 bool separate_zero; 1620 int undo; 1621 1622 /* We're going to print the states 3 times */ 1623 if (get_db_state_count() > 10000 / 3) 1624 return 0; 1625 1626 if (!get_implied_rl(expr, &rl) || !rl) 1627 return 0; 1628 /* Forget about INT_MAX and larger */ 1629 if (rl_max(rl).value <= 0) 1630 return 0; 1631 if (!sval_is_negative(rl_min(rl))) 1632 return 0; 1633 1634 sm = get_sm_state_expr(SMATCH_EXTRA, expr); 1635 if (!sm) 1636 return 0; 1637 if (!has_possible_negative(sm)) 1638 return 0; 1639 separate_zero = has_separate_zero_null(sm); 1640 1641 if (!assume(compare_expression(expr, separate_zero ? '>' : SPECIAL_GTE, zero_expr()))) 1642 return 0; 1643 1644 return_id++; 1645 return_ranges = get_return_ranges_str(expr, &ret_rl); 1646 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl)); 1647 FOR_EACH_PTR(returned_state_callbacks, cb) { 1648 cb->callback(return_id, (char *)return_ranges, expr); 1649 } END_FOR_EACH_PTR(cb); 1650 1651 end_assume(); 1652 1653 if (separate_zero) { 1654 undo = assume(compare_expression(expr, SPECIAL_EQUAL, zero_expr())); 1655 1656 return_id++; 1657 return_ranges = get_return_ranges_str(expr, &ret_rl); 1658 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl)); 1659 FOR_EACH_PTR(returned_state_callbacks, cb) { 1660 cb->callback(return_id, (char *)return_ranges, expr); 1661 } END_FOR_EACH_PTR(cb); 1662 1663 if (undo) 1664 end_assume(); 1665 } 1666 1667 undo = assume(compare_expression(expr, '<', zero_expr())); 1668 1669 return_id++; 1670 return_ranges = get_return_ranges_str(expr, &ret_rl); 1671 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl)); 1672 FOR_EACH_PTR(returned_state_callbacks, cb) { 1673 cb->callback(return_id, (char *)return_ranges, expr); 1674 } END_FOR_EACH_PTR(cb); 1675 1676 if (undo) 1677 end_assume(); 1678 1679 return 1; 1680 } 1681 1682 static int call_return_state_hooks_split_null_non_null_zero(struct expression *expr) 1683 { 1684 struct returned_state_callback *cb; 1685 struct range_list *rl; 1686 struct range_list *nonnull_rl; 1687 sval_t null_sval; 1688 struct range_list *null_rl = NULL; 1689 char *return_ranges; 1690 struct sm_state *sm; 1691 struct smatch_state *state; 1692 int nr_states; 1693 int final_pass_orig = final_pass; 1694 1695 if (!expr || expr_equal_to_param(expr, -1)) 1696 return 0; 1697 if (expr->type == EXPR_CALL) 1698 return 0; 1699 1700 sm = get_sm_state_expr(SMATCH_EXTRA, expr); 1701 if (!sm) 1702 return 0; 1703 if (ptr_list_size((struct ptr_list *)sm->possible) == 1) 1704 return 0; 1705 state = sm->state; 1706 if (!estate_rl(state)) 1707 return 0; 1708 if (estate_min(state).value == 0 && estate_max(state).value == 0) 1709 return 0; 1710 if (!has_separate_zero_null(sm)) 1711 return 0; 1712 1713 nr_states = get_db_state_count(); 1714 if (option_info && nr_states >= 1500) 1715 return 0; 1716 1717 rl = estate_rl(state); 1718 1719 __push_fake_cur_stree(); 1720 1721 final_pass = 0; 1722 __split_whole_condition(expr); 1723 final_pass = final_pass_orig; 1724 1725 nonnull_rl = rl_filter(rl, rl_zero()); 1726 return_ranges = show_rl(nonnull_rl); 1727 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(nonnull_rl)); 1728 1729 return_id++; 1730 FOR_EACH_PTR(returned_state_callbacks, cb) { 1731 cb->callback(return_id, return_ranges, expr); 1732 } END_FOR_EACH_PTR(cb); 1733 1734 __push_true_states(); 1735 __use_false_states(); 1736 1737 return_ranges = alloc_sname("0"); 1738 null_sval = sval_type_val(rl_type(rl), 0); 1739 add_range(&null_rl, null_sval, null_sval); 1740 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(null_rl)); 1741 return_id++; 1742 FOR_EACH_PTR(returned_state_callbacks, cb) { 1743 cb->callback(return_id, return_ranges, expr); 1744 } END_FOR_EACH_PTR(cb); 1745 1746 __merge_true_states(); 1747 __free_fake_cur_stree(); 1748 1749 return 1; 1750 } 1751 1752 static bool is_kernel_success_fail(struct sm_state *sm) 1753 { 1754 struct sm_state *tmp; 1755 struct range_list *rl; 1756 bool has_zero = false; 1757 bool has_neg = false; 1758 1759 if (!type_signed(estate_type(sm->state))) 1760 return false; 1761 1762 FOR_EACH_PTR(sm->possible, tmp) { 1763 rl = estate_rl(tmp->state); 1764 if (!rl) 1765 return false; 1766 if (rl_min(rl).value == 0 && rl_max(rl).value == 0) { 1767 has_zero = true; 1768 continue; 1769 } 1770 has_neg = true; 1771 if (rl_min(rl).value >= -4095 && rl_max(rl).value < 0) 1772 continue; 1773 if (strcmp(tmp->state->name, "s32min-(-1)") == 0) 1774 continue; 1775 if (strcmp(tmp->state->name, "s32min-(-1),1-s32max") == 0) 1776 continue; 1777 return false; 1778 } END_FOR_EACH_PTR(tmp); 1779 1780 return has_zero && has_neg; 1781 } 1782 1783 static int call_return_state_hooks_split_success_fail(struct expression *expr) 1784 { 1785 struct sm_state *sm; 1786 struct range_list *rl; 1787 struct range_list *nonzero_rl; 1788 sval_t zero_sval; 1789 struct range_list *zero_rl = NULL; 1790 int nr_states; 1791 struct returned_state_callback *cb; 1792 char *return_ranges; 1793 int final_pass_orig = final_pass; 1794 1795 if (option_project != PROJ_KERNEL) 1796 return 0; 1797 1798 nr_states = get_db_state_count(); 1799 if (nr_states > 2000) 1800 return 0; 1801 1802 sm = get_sm_state_expr(SMATCH_EXTRA, expr); 1803 if (!sm) 1804 return 0; 1805 if (ptr_list_size((struct ptr_list *)sm->possible) == 1) 1806 return 0; 1807 if (!is_kernel_success_fail(sm)) 1808 return 0; 1809 1810 rl = estate_rl(sm->state); 1811 if (!rl) 1812 return 0; 1813 1814 __push_fake_cur_stree(); 1815 1816 final_pass = 0; 1817 __split_whole_condition(expr); 1818 final_pass = final_pass_orig; 1819 1820 nonzero_rl = rl_filter(rl, rl_zero()); 1821 nonzero_rl = cast_rl(cur_func_return_type(), nonzero_rl); 1822 return_ranges = show_rl(nonzero_rl); 1823 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(nonzero_rl)); 1824 1825 return_id++; 1826 FOR_EACH_PTR(returned_state_callbacks, cb) { 1827 cb->callback(return_id, return_ranges, expr); 1828 } END_FOR_EACH_PTR(cb); 1829 1830 __push_true_states(); 1831 __use_false_states(); 1832 1833 return_ranges = alloc_sname("0"); 1834 zero_sval = sval_type_val(rl_type(rl), 0); 1835 add_range(&zero_rl, zero_sval, zero_sval); 1836 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(zero_rl)); 1837 return_id++; 1838 FOR_EACH_PTR(returned_state_callbacks, cb) { 1839 cb->callback(return_id, return_ranges, expr); 1840 } END_FOR_EACH_PTR(cb); 1841 1842 __merge_true_states(); 1843 __free_fake_cur_stree(); 1844 1845 return 1; 1846 } 1847 1848 static int is_boolean(struct expression *expr) 1849 { 1850 struct range_list *rl; 1851 1852 if (!get_implied_rl(expr, &rl)) 1853 return 0; 1854 if (rl_min(rl).value == 0 && rl_max(rl).value == 1) 1855 return 1; 1856 return 0; 1857 } 1858 1859 static int splitable_function_call(struct expression *expr) 1860 { 1861 struct sm_state *sm; 1862 char buf[64]; 1863 1864 if (!expr || expr->type != EXPR_CALL) 1865 return 0; 1866 snprintf(buf, sizeof(buf), "return %p", expr); 1867 sm = get_sm_state(SMATCH_EXTRA, buf, NULL); 1868 return split_possible_helper(sm, expr); 1869 } 1870 1871 static struct sm_state *find_bool_param(void) 1872 { 1873 struct stree *start_states; 1874 struct symbol *arg; 1875 struct sm_state *sm, *tmp; 1876 sval_t sval; 1877 1878 start_states = get_start_states(); 1879 1880 FOR_EACH_PTR_REVERSE(cur_func_sym->ctype.base_type->arguments, arg) { 1881 if (!arg->ident) 1882 continue; 1883 sm = get_sm_state_stree(start_states, SMATCH_EXTRA, arg->ident->name, arg); 1884 if (!sm) 1885 continue; 1886 if (rl_min(estate_rl(sm->state)).value != 0 || 1887 rl_max(estate_rl(sm->state)).value != 1) 1888 continue; 1889 goto found; 1890 } END_FOR_EACH_PTR_REVERSE(arg); 1891 1892 return NULL; 1893 1894 found: 1895 /* 1896 * Check if it's splitable. If not, then splitting it up is likely not 1897 * useful for the callers. 1898 */ 1899 FOR_EACH_PTR(sm->possible, tmp) { 1900 if (is_merged(tmp)) 1901 continue; 1902 if (!estate_get_single_value(tmp->state, &sval)) 1903 return NULL; 1904 } END_FOR_EACH_PTR(tmp); 1905 1906 return sm; 1907 } 1908 1909 static int split_on_bool_sm(struct sm_state *sm, struct expression *expr) 1910 { 1911 struct returned_state_callback *cb; 1912 struct range_list *ret_rl; 1913 const char *return_ranges; 1914 struct sm_state *tmp; 1915 int ret = 0; 1916 struct state_list *already_handled = NULL; 1917 1918 if (!sm || !sm->merged) 1919 return 0; 1920 1921 if (too_many_possible(sm)) 1922 return 0; 1923 1924 FOR_EACH_PTR(sm->possible, tmp) { 1925 if (tmp->merged) 1926 continue; 1927 if (ptr_in_list(tmp, already_handled)) 1928 continue; 1929 add_ptr_list(&already_handled, tmp); 1930 1931 ret = 1; 1932 __push_fake_cur_stree(); 1933 1934 overwrite_states_using_pool(sm, tmp); 1935 1936 return_ranges = get_return_ranges_str(expr, &ret_rl); 1937 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl)); 1938 return_id++; 1939 FOR_EACH_PTR(returned_state_callbacks, cb) { 1940 cb->callback(return_id, (char *)return_ranges, expr); 1941 } END_FOR_EACH_PTR(cb); 1942 1943 __free_fake_cur_stree(); 1944 } END_FOR_EACH_PTR(tmp); 1945 1946 free_slist(&already_handled); 1947 1948 return ret; 1949 } 1950 1951 static int split_by_bool_param(struct expression *expr) 1952 { 1953 struct sm_state *start_sm, *sm; 1954 sval_t sval; 1955 1956 start_sm = find_bool_param(); 1957 if (!start_sm) 1958 return 0; 1959 sm = get_sm_state(SMATCH_EXTRA, start_sm->name, start_sm->sym); 1960 if (!sm || estate_get_single_value(sm->state, &sval)) 1961 return 0; 1962 1963 if (get_db_state_count() * 2 >= 2000) 1964 return 0; 1965 1966 return split_on_bool_sm(sm, expr); 1967 } 1968 1969 static int split_by_null_nonnull_param(struct expression *expr) 1970 { 1971 struct symbol *arg; 1972 struct sm_state *sm; 1973 int nr_possible; 1974 1975 /* function must only take one pointer */ 1976 if (ptr_list_size((struct ptr_list *)cur_func_sym->ctype.base_type->arguments) != 1) 1977 return 0; 1978 arg = first_ptr_list((struct ptr_list *)cur_func_sym->ctype.base_type->arguments); 1979 if (!arg->ident) 1980 return 0; 1981 if (get_real_base_type(arg)->type != SYM_PTR) 1982 return 0; 1983 1984 if (param_was_set_var_sym(arg->ident->name, arg)) 1985 return 0; 1986 sm = get_sm_state(SMATCH_EXTRA, arg->ident->name, arg); 1987 if (!sm) 1988 return 0; 1989 1990 if (!has_separate_zero_null(sm)) 1991 return 0; 1992 1993 nr_possible = ptr_list_size((struct ptr_list *)sm->possible); 1994 if (get_db_state_count() * nr_possible >= 2000) 1995 return 0; 1996 1997 return split_on_bool_sm(sm, expr); 1998 } 1999 2000 struct expression *strip_expr_statement(struct expression *expr) 2001 { 2002 struct expression *orig = expr; 2003 struct statement *stmt, *last_stmt; 2004 2005 if (!expr) 2006 return NULL; 2007 if (expr->type == EXPR_PREOP && expr->op == '(') 2008 expr = expr->unop; 2009 if (expr->type != EXPR_STATEMENT) 2010 return orig; 2011 stmt = expr->statement; 2012 if (!stmt || stmt->type != STMT_COMPOUND) 2013 return orig; 2014 2015 last_stmt = last_ptr_list((struct ptr_list *)stmt->stmts); 2016 if (!last_stmt || last_stmt->type == STMT_LABEL) 2017 last_stmt = last_stmt->label_statement; 2018 if (!last_stmt || last_stmt->type != STMT_EXPRESSION) 2019 return orig; 2020 return strip_expr(last_stmt->expression); 2021 } 2022 2023 static void call_return_state_hooks(struct expression *expr) 2024 { 2025 struct returned_state_callback *cb; 2026 struct range_list *ret_rl; 2027 const char *return_ranges; 2028 int nr_states; 2029 sval_t sval; 2030 2031 if (__path_is_null()) 2032 return; 2033 2034 expr = strip_expr(expr); 2035 expr = strip_expr_statement(expr); 2036 2037 if (is_impossible_path()) 2038 goto vanilla; 2039 2040 if (expr && (expr->type == EXPR_COMPARE || 2041 !get_implied_value(expr, &sval)) && 2042 (is_condition(expr) || is_boolean(expr))) { 2043 call_return_state_hooks_compare(expr); 2044 return; 2045 } else if (call_return_state_hooks_conditional(expr)) { 2046 return; 2047 } else if (call_return_state_hooks_split_possible(expr)) { 2048 return; 2049 } else if (split_positive_from_negative(expr)) { 2050 return; 2051 } else if (call_return_state_hooks_split_null_non_null_zero(expr)) { 2052 return; 2053 } else if (call_return_state_hooks_split_success_fail(expr)) { 2054 return; 2055 } else if (splitable_function_call(expr)) { 2056 return; 2057 } else if (split_by_bool_param(expr)) { 2058 } else if (split_by_null_nonnull_param(expr)) { 2059 return; 2060 } 2061 2062 vanilla: 2063 return_ranges = get_return_ranges_str(expr, &ret_rl); 2064 set_state(RETURN_ID, "return_ranges", NULL, alloc_estate_rl(ret_rl)); 2065 2066 return_id++; 2067 nr_states = get_db_state_count(); 2068 if (nr_states >= 10000) { 2069 match_return_info(return_id, (char *)return_ranges, expr); 2070 print_limited_param_set(return_id, (char *)return_ranges, expr); 2071 mark_all_params_untracked(return_id, (char *)return_ranges, expr); 2072 return; 2073 } 2074 FOR_EACH_PTR(returned_state_callbacks, cb) { 2075 cb->callback(return_id, (char *)return_ranges, expr); 2076 } END_FOR_EACH_PTR(cb); 2077 } 2078 2079 static void print_returned_struct_members(int return_id, char *return_ranges, struct expression *expr) 2080 { 2081 struct returned_member_callback *cb; 2082 struct stree *stree; 2083 struct sm_state *sm; 2084 struct symbol *type; 2085 char *name; 2086 char member_name[256]; 2087 int len; 2088 2089 type = get_type(expr); 2090 if (!type || type->type != SYM_PTR) 2091 return; 2092 name = expr_to_var(expr); 2093 if (!name) 2094 return; 2095 2096 member_name[sizeof(member_name) - 1] = '\0'; 2097 strcpy(member_name, "$"); 2098 2099 len = strlen(name); 2100 FOR_EACH_PTR(returned_member_callbacks, cb) { 2101 stree = __get_cur_stree(); 2102 FOR_EACH_MY_SM(cb->owner, stree, sm) { 2103 if (sm->name[0] == '*' && strcmp(sm->name + 1, name) == 0) { 2104 strcpy(member_name, "*$"); 2105 cb->callback(return_id, return_ranges, expr, member_name, sm->state); 2106 continue; 2107 } 2108 if (strncmp(sm->name, name, len) != 0) 2109 continue; 2110 if (strncmp(sm->name + len, "->", 2) != 0) 2111 continue; 2112 snprintf(member_name, sizeof(member_name), "$%s", sm->name + len); 2113 cb->callback(return_id, return_ranges, expr, member_name, sm->state); 2114 } END_FOR_EACH_SM(sm); 2115 } END_FOR_EACH_PTR(cb); 2116 2117 free_string(name); 2118 } 2119 2120 static void reset_memdb(struct symbol *sym) 2121 { 2122 mem_sql(NULL, NULL, "delete from caller_info;"); 2123 mem_sql(NULL, NULL, "delete from return_states;"); 2124 mem_sql(NULL, NULL, "delete from call_implies;"); 2125 mem_sql(NULL, NULL, "delete from return_implies;"); 2126 } 2127 2128 static void match_end_func_info(struct symbol *sym) 2129 { 2130 if (__path_is_null()) 2131 return; 2132 call_return_state_hooks(NULL); 2133 } 2134 2135 static void match_after_func(struct symbol *sym) 2136 { 2137 if (!__inline_fn) 2138 reset_memdb(sym); 2139 } 2140 2141 static void init_memdb(void) 2142 { 2143 char *err = NULL; 2144 int rc; 2145 const char *schema_files[] = { 2146 "db/db.schema", 2147 "db/caller_info.schema", 2148 "db/common_caller_info.schema", 2149 "db/return_states.schema", 2150 "db/function_type_size.schema", 2151 "db/type_size.schema", 2152 "db/function_type_info.schema", 2153 "db/type_info.schema", 2154 "db/call_implies.schema", 2155 "db/return_implies.schema", 2156 "db/function_ptr.schema", 2157 "db/local_values.schema", 2158 "db/function_type_value.schema", 2159 "db/type_value.schema", 2160 "db/function_type.schema", 2161 "db/data_info.schema", 2162 "db/parameter_name.schema", 2163 "db/constraints.schema", 2164 "db/constraints_required.schema", 2165 "db/fn_ptr_data_link.schema", 2166 "db/fn_data_link.schema", 2167 "db/mtag_about.schema", 2168 "db/mtag_map.schema", 2169 "db/mtag_data.schema", 2170 "db/mtag_alias.schema", 2171 }; 2172 static char buf[4096]; 2173 int fd; 2174 int ret; 2175 int i; 2176 2177 rc = sqlite3_open(":memory:", &mem_db); 2178 if (rc != SQLITE_OK) { 2179 sm_ierror("starting In-Memory database."); 2180 return; 2181 } 2182 2183 for (i = 0; i < ARRAY_SIZE(schema_files); i++) { 2184 fd = open_schema_file(schema_files[i]); 2185 if (fd < 0) 2186 continue; 2187 ret = read(fd, buf, sizeof(buf)); 2188 if (ret < 0) { 2189 sm_ierror("failed to read: %s", schema_files[i]); 2190 continue; 2191 } 2192 close(fd); 2193 if (ret == sizeof(buf)) { 2194 sm_ierror("Schema file too large: %s (limit %zd bytes)", 2195 schema_files[i], sizeof(buf)); 2196 continue; 2197 } 2198 buf[ret] = '\0'; 2199 rc = sqlite3_exec(mem_db, buf, NULL, NULL, &err); 2200 if (rc != SQLITE_OK) { 2201 sm_ierror("SQL error #2: %s", err); 2202 sm_ierror("%s", buf); 2203 } 2204 } 2205 } 2206 2207 static void init_cachedb(void) 2208 { 2209 char *err = NULL; 2210 int rc; 2211 const char *schema_files[] = { 2212 "db/call_implies.schema", 2213 "db/return_implies.schema", 2214 "db/type_info.schema", 2215 "db/mtag_data.schema", 2216 "db/sink_info.schema", 2217 }; 2218 static char buf[4096]; 2219 int fd; 2220 int ret; 2221 int i; 2222 2223 rc = sqlite3_open(":memory:", &cache_db); 2224 if (rc != SQLITE_OK) { 2225 sm_ierror("starting In-Memory database."); 2226 return; 2227 } 2228 2229 for (i = 0; i < ARRAY_SIZE(schema_files); i++) { 2230 fd = open_schema_file(schema_files[i]); 2231 if (fd < 0) 2232 continue; 2233 ret = read(fd, buf, sizeof(buf)); 2234 if (ret < 0) { 2235 sm_ierror("failed to read: %s", schema_files[i]); 2236 continue; 2237 } 2238 close(fd); 2239 if (ret == sizeof(buf)) { 2240 sm_ierror("Schema file too large: %s (limit %zd bytes)", 2241 schema_files[i], sizeof(buf)); 2242 continue; 2243 } 2244 buf[ret] = '\0'; 2245 rc = sqlite3_exec(cache_db, buf, NULL, NULL, &err); 2246 if (rc != SQLITE_OK) { 2247 sm_ierror("SQL error #2: %s", err); 2248 sm_ierror("%s", buf); 2249 } 2250 } 2251 } 2252 2253 static int save_cache_data(void *_table, int argc, char **argv, char **azColName) 2254 { 2255 static char buf[4096]; 2256 char tmp[256]; 2257 char *p = buf; 2258 char *table = _table; 2259 int i; 2260 2261 2262 p += snprintf(p, 4096 - (p - buf), "insert or ignore into %s values (", table); 2263 for (i = 0; i < argc; i++) { 2264 if (i) 2265 p += snprintf(p, 4096 - (p - buf), ", "); 2266 sqlite3_snprintf(sizeof(tmp), tmp, "%q", escape_newlines(argv[i])); 2267 p += snprintf(p, 4096 - (p - buf), "'%s'", tmp); 2268 2269 } 2270 p += snprintf(p, 4096 - (p - buf), ");"); 2271 if (p - buf > 4096) 2272 return 0; 2273 2274 sm_msg("SQL: %s", buf); 2275 return 0; 2276 } 2277 2278 static void dump_cache(struct symbol_list *sym_list) 2279 { 2280 if (!option_info) 2281 return; 2282 cache_sql(&save_cache_data, (char *)"type_info", "select * from type_info;"); 2283 cache_sql(&save_cache_data, (char *)"return_implies", "select * from return_implies;"); 2284 cache_sql(&save_cache_data, (char *)"call_implies", "select * from call_implies;"); 2285 cache_sql(&save_cache_data, (char *)"mtag_data", "select * from mtag_data;"); 2286 cache_sql(&save_cache_data, (char *)"sink_info", "select * from sink_info;"); 2287 } 2288 2289 void open_smatch_db(char *db_file) 2290 { 2291 int rc; 2292 2293 if (option_no_db) 2294 return; 2295 2296 use_states = malloc(num_checks + 1); 2297 memset(use_states, 0xff, num_checks + 1); 2298 2299 init_memdb(); 2300 init_cachedb(); 2301 2302 rc = sqlite3_open_v2(db_file, &smatch_db, SQLITE_OPEN_READONLY, NULL); 2303 if (rc != SQLITE_OK) { 2304 option_no_db = 1; 2305 return; 2306 } 2307 run_sql(NULL, NULL, 2308 "PRAGMA cache_size = %d;", SQLITE_CACHE_PAGES); 2309 return; 2310 } 2311 2312 static void register_common_funcs(void) 2313 { 2314 struct token *token; 2315 char *func; 2316 char filename[256]; 2317 2318 if (option_project == PROJ_NONE) 2319 strcpy(filename, "common_functions"); 2320 else 2321 snprintf(filename, 256, "%s.common_functions", option_project_str); 2322 2323 token = get_tokens_file(filename); 2324 if (!token) 2325 return; 2326 if (token_type(token) != TOKEN_STREAMBEGIN) 2327 return; 2328 token = token->next; 2329 while (token_type(token) != TOKEN_STREAMEND) { 2330 if (token_type(token) != TOKEN_IDENT) 2331 return; 2332 func = alloc_string(show_ident(token->ident)); 2333 add_ptr_list(&common_funcs, func); 2334 token = token->next; 2335 } 2336 clear_token_alloc(); 2337 } 2338 2339 static char *get_next_string(char **str) 2340 { 2341 static char string[256]; 2342 char *start; 2343 char *p = *str; 2344 int len, i, j; 2345 2346 if (*p == '\0') 2347 return NULL; 2348 start = p; 2349 2350 while (*p != '\0' && *p != '\n') { 2351 if (*p == '\\' && *(p + 1) == ' ') { 2352 p += 2; 2353 continue; 2354 } 2355 if (*p == ' ') 2356 break; 2357 p++; 2358 } 2359 2360 len = p - start; 2361 if (len >= sizeof(string)) { 2362 memcpy(string, start, sizeof(string)); 2363 string[sizeof(string) - 1] = '\0'; 2364 sm_ierror("return_fix: '%s' too long", string); 2365 **str = '\0'; 2366 return NULL; 2367 } 2368 memcpy(string, start, len); 2369 string[len] = '\0'; 2370 for (i = 0; i < sizeof(string) - 1; i++) { 2371 if (string[i] == '\\' && string[i + 1] == ' ') { 2372 for (j = i; string[j] != '\0'; j++) 2373 string[j] = string[j + 1]; 2374 } 2375 } 2376 if (*p != '\0') 2377 p++; 2378 *str = p; 2379 return string; 2380 } 2381 2382 static void register_return_replacements(void) 2383 { 2384 char *func, *orig, *new; 2385 char filename[256]; 2386 char buf[4096]; 2387 int fd, ret, i; 2388 char *p; 2389 2390 snprintf(filename, 256, "db/%s.return_fixes", option_project_str); 2391 fd = open_schema_file(filename); 2392 if (fd < 0) 2393 return; 2394 ret = read(fd, buf, sizeof(buf)); 2395 close(fd); 2396 if (ret < 0) 2397 return; 2398 if (ret == sizeof(buf)) { 2399 sm_ierror("file too large: %s (limit %zd bytes)", 2400 filename, sizeof(buf)); 2401 return; 2402 } 2403 buf[ret] = '\0'; 2404 2405 p = buf; 2406 while (*p) { 2407 get_next_string(&p); 2408 replace_count++; 2409 } 2410 if (replace_count == 0 || replace_count % 3 != 0) { 2411 replace_count = 0; 2412 return; 2413 } 2414 replace_table = malloc(replace_count * sizeof(char *)); 2415 2416 p = buf; 2417 i = 0; 2418 while (*p) { 2419 func = alloc_string(get_next_string(&p)); 2420 orig = alloc_string(get_next_string(&p)); 2421 new = alloc_string(get_next_string(&p)); 2422 2423 replace_table[i++] = func; 2424 replace_table[i++] = orig; 2425 replace_table[i++] = new; 2426 } 2427 } 2428 2429 void register_definition_db_callbacks(int id) 2430 { 2431 add_hook(&match_call_info, FUNCTION_CALL_HOOK); 2432 add_split_return_callback(match_return_info); 2433 add_split_return_callback(print_returned_struct_members); 2434 add_hook(&call_return_state_hooks, RETURN_HOOK); 2435 add_hook(&match_end_func_info, END_FUNC_HOOK); 2436 add_hook(&match_after_func, AFTER_FUNC_HOOK); 2437 2438 add_hook(&match_data_from_db, FUNC_DEF_HOOK); 2439 add_hook(&match_call_implies, FUNC_DEF_HOOK); 2440 add_hook(&match_return_implies, CALL_HOOK_AFTER_INLINE); 2441 2442 register_common_funcs(); 2443 register_return_replacements(); 2444 2445 add_hook(&dump_cache, END_FILE_HOOK); 2446 } 2447 2448 void register_db_call_marker(int id) 2449 { 2450 add_hook(&match_call_marker, FUNCTION_CALL_HOOK); 2451 } 2452 2453 char *return_state_to_var_sym(struct expression *expr, int param, const char *key, struct symbol **sym) 2454 { 2455 struct expression *arg; 2456 char *name = NULL; 2457 char member_name[256]; 2458 2459 *sym = NULL; 2460 2461 if (param == -1) { 2462 const char *star = ""; 2463 2464 if (expr->type != EXPR_ASSIGNMENT) 2465 return NULL; 2466 if (get_type(expr->left) == &int_ctype && strcmp(key, "$") != 0) 2467 return NULL; 2468 name = expr_to_var_sym(expr->left, sym); 2469 if (!name) 2470 return NULL; 2471 if (key[0] == '*') { 2472 star = "*"; 2473 key++; 2474 } 2475 if (strncmp(key, "$", 1) != 0) 2476 return name; 2477 snprintf(member_name, sizeof(member_name), "%s%s%s", star, name, key + 1); 2478 free_string(name); 2479 return alloc_string(member_name); 2480 } 2481 2482 while (expr->type == EXPR_ASSIGNMENT) 2483 expr = strip_expr(expr->right); 2484 if (expr->type != EXPR_CALL) 2485 return NULL; 2486 2487 arg = get_argument_from_call_expr(expr->args, param); 2488 if (!arg) 2489 return NULL; 2490 2491 return get_variable_from_key(arg, key, sym); 2492 } 2493 2494 char *get_variable_from_key(struct expression *arg, const char *key, struct symbol **sym) 2495 { 2496 char buf[256]; 2497 char *tmp; 2498 int star_cnt = 0; 2499 2500 if (!arg) 2501 return NULL; 2502 2503 arg = strip_expr(arg); 2504 2505 if (strcmp(key, "$") == 0) 2506 return expr_to_var_sym(arg, sym); 2507 2508 if (strcmp(key, "*$") == 0) { 2509 if (arg->type == EXPR_PREOP && arg->op == '&') { 2510 arg = strip_expr(arg->unop); 2511 return expr_to_var_sym(arg, sym); 2512 } else { 2513 tmp = expr_to_var_sym(arg, sym); 2514 if (!tmp) 2515 return NULL; 2516 snprintf(buf, sizeof(buf), "*%s", tmp); 2517 free_string(tmp); 2518 return alloc_string(buf); 2519 } 2520 } 2521 2522 while (key[0] == '*') { 2523 star_cnt++; 2524 key++; 2525 } 2526 2527 if (arg->type == EXPR_PREOP && arg->op == '&' && star_cnt) { 2528 arg = strip_expr(arg->unop); 2529 star_cnt--; 2530 } 2531 2532 if (arg->type == EXPR_PREOP && arg->op == '&') { 2533 arg = strip_expr(arg->unop); 2534 tmp = expr_to_var_sym(arg, sym); 2535 if (!tmp) 2536 return NULL; 2537 snprintf(buf, sizeof(buf), "%.*s%s.%s", 2538 star_cnt, "**********", tmp, key + 3); 2539 return alloc_string(buf); 2540 } 2541 2542 tmp = expr_to_var_sym(arg, sym); 2543 if (!tmp) 2544 return NULL; 2545 snprintf(buf, sizeof(buf), "%.*s%s%s", star_cnt, "**********", tmp, key + 1); 2546 free_string(tmp); 2547 return alloc_string(buf); 2548 } 2549 2550 char *get_chunk_from_key(struct expression *arg, char *key, struct symbol **sym, struct var_sym_list **vsl) 2551 { 2552 *vsl = NULL; 2553 2554 if (strcmp("$", key) == 0) 2555 return expr_to_chunk_sym_vsl(arg, sym, vsl); 2556 return get_variable_from_key(arg, key, sym); 2557 } 2558 2559 const char *state_name_to_param_name(const char *state_name, const char *param_name) 2560 { 2561 int star_cnt = 0; 2562 int name_len; 2563 char buf[256]; 2564 2565 name_len = strlen(param_name); 2566 2567 while (state_name[0] == '*') { 2568 star_cnt++; 2569 state_name++; 2570 } 2571 2572 /* ten out of ten stars! */ 2573 if (star_cnt > 10) 2574 return NULL; 2575 2576 if (strcmp(state_name, param_name) == 0) { 2577 snprintf(buf, sizeof(buf), "%.*s$", star_cnt, "**********"); 2578 return alloc_sname(buf); 2579 } 2580 2581 if (state_name[name_len] == '-' && /* check for '-' from "->" */ 2582 strncmp(state_name, param_name, name_len) == 0) { 2583 snprintf(buf, sizeof(buf), "%.*s$%s", star_cnt, "**********", state_name + name_len); 2584 return alloc_sname(buf); 2585 } 2586 return NULL; 2587 } 2588 2589 const char *get_param_name_var_sym(const char *name, struct symbol *sym) 2590 { 2591 if (!sym || !sym->ident) 2592 return NULL; 2593 2594 return state_name_to_param_name(name, sym->ident->name); 2595 } 2596 2597 const char *get_mtag_name_var_sym(const char *state_name, struct symbol *sym) 2598 { 2599 struct symbol *type; 2600 const char *sym_name; 2601 int name_len; 2602 static char buf[256]; 2603 2604 /* 2605 * mtag_name is different from param_name because mtags can be a struct 2606 * instead of a struct pointer. But we want to treat it like a pointer 2607 * because really an mtag is a pointer. Or in other words, if you pass 2608 * a struct foo then you want to talk about foo.bar but with an mtag 2609 * you want to refer to it as foo->bar. 2610 * 2611 */ 2612 2613 if (!sym || !sym->ident) 2614 return NULL; 2615 2616 type = get_real_base_type(sym); 2617 if (type && type->type == SYM_BASETYPE) 2618 return "*$"; 2619 2620 sym_name = sym->ident->name; 2621 name_len = strlen(sym_name); 2622 2623 if (state_name[name_len] == '.' && /* check for '-' from "->" */ 2624 strncmp(state_name, sym_name, name_len) == 0) { 2625 snprintf(buf, sizeof(buf), "$->%s", state_name + name_len + 1); 2626 return buf; 2627 } 2628 2629 return state_name_to_param_name(state_name, sym_name); 2630 } 2631 2632 const char *get_mtag_name_expr(struct expression *expr) 2633 { 2634 char *name; 2635 struct symbol *sym; 2636 const char *ret = NULL; 2637 2638 name = expr_to_var_sym(expr, &sym); 2639 if (!name || !sym) 2640 goto free; 2641 2642 ret = get_mtag_name_var_sym(name, sym); 2643 free: 2644 free_string(name); 2645 return ret; 2646 } 2647 2648 const char *get_param_name(struct sm_state *sm) 2649 { 2650 return get_param_name_var_sym(sm->name, sm->sym); 2651 } 2652 2653 char *get_data_info_name(struct expression *expr) 2654 { 2655 struct symbol *sym; 2656 char *name; 2657 char buf[256]; 2658 char *ret = NULL; 2659 2660 expr = strip_expr(expr); 2661 name = get_member_name(expr); 2662 if (name) 2663 return name; 2664 name = expr_to_var_sym(expr, &sym); 2665 if (!name || !sym) 2666 goto free; 2667 if (!(sym->ctype.modifiers & MOD_TOPLEVEL)) 2668 goto free; 2669 if (sym->ctype.modifiers & MOD_STATIC) 2670 snprintf(buf, sizeof(buf), "static %s", name); 2671 else 2672 snprintf(buf, sizeof(buf), "global %s", name); 2673 ret = alloc_sname(buf); 2674 free: 2675 free_string(name); 2676 return ret; 2677 } 2678