1eda14cbcSMatt Macy /* 2eda14cbcSMatt Macy ** $Id: lstring.c,v 2.26.1.1 2013/04/12 18:48:47 roberto Exp $ 3eda14cbcSMatt Macy ** String table (keeps all strings handled by Lua) 4eda14cbcSMatt Macy ** See Copyright Notice in lua.h 5eda14cbcSMatt Macy */ 6eda14cbcSMatt Macy 7eda14cbcSMatt Macy 8eda14cbcSMatt Macy #define lstring_c 9eda14cbcSMatt Macy #define LUA_CORE 10eda14cbcSMatt Macy 11eda14cbcSMatt Macy #include <sys/lua/lua.h> 12eda14cbcSMatt Macy 13eda14cbcSMatt Macy #include "lmem.h" 14eda14cbcSMatt Macy #include "lobject.h" 15eda14cbcSMatt Macy #include "lstate.h" 16eda14cbcSMatt Macy #include "lstring.h" 17eda14cbcSMatt Macy 18eda14cbcSMatt Macy 19eda14cbcSMatt Macy /* 20eda14cbcSMatt Macy ** Lua will use at most ~(2^LUAI_HASHLIMIT) bytes from a string to 21eda14cbcSMatt Macy ** compute its hash 22eda14cbcSMatt Macy */ 23eda14cbcSMatt Macy #if !defined(LUAI_HASHLIMIT) 24eda14cbcSMatt Macy #define LUAI_HASHLIMIT 5 25eda14cbcSMatt Macy #endif 26eda14cbcSMatt Macy 27eda14cbcSMatt Macy 28eda14cbcSMatt Macy /* 29eda14cbcSMatt Macy ** equality for long strings 30eda14cbcSMatt Macy */ 31eda14cbcSMatt Macy int luaS_eqlngstr (TString *a, TString *b) { 32eda14cbcSMatt Macy size_t len = a->tsv.len; 33eda14cbcSMatt Macy lua_assert(a->tsv.tt == LUA_TLNGSTR && b->tsv.tt == LUA_TLNGSTR); 34eda14cbcSMatt Macy return (a == b) || /* same instance or... */ 35eda14cbcSMatt Macy ((len == b->tsv.len) && /* equal length and ... */ 36eda14cbcSMatt Macy (memcmp(getstr(a), getstr(b), len) == 0)); /* equal contents */ 37eda14cbcSMatt Macy } 38eda14cbcSMatt Macy 39eda14cbcSMatt Macy 40eda14cbcSMatt Macy /* 41eda14cbcSMatt Macy ** equality for strings 42eda14cbcSMatt Macy */ 43eda14cbcSMatt Macy int luaS_eqstr (TString *a, TString *b) { 44eda14cbcSMatt Macy return (a->tsv.tt == b->tsv.tt) && 45eda14cbcSMatt Macy (a->tsv.tt == LUA_TSHRSTR ? eqshrstr(a, b) : luaS_eqlngstr(a, b)); 46eda14cbcSMatt Macy } 47eda14cbcSMatt Macy 48eda14cbcSMatt Macy 49eda14cbcSMatt Macy unsigned int luaS_hash (const char *str, size_t l, unsigned int seed) { 50eda14cbcSMatt Macy unsigned int h = seed ^ cast(unsigned int, l); 51eda14cbcSMatt Macy size_t l1; 52eda14cbcSMatt Macy size_t step = (l >> LUAI_HASHLIMIT) + 1; 53eda14cbcSMatt Macy for (l1 = l; l1 >= step; l1 -= step) 54eda14cbcSMatt Macy h = h ^ ((h<<5) + (h>>2) + cast_byte(str[l1 - 1])); 55eda14cbcSMatt Macy return h; 56eda14cbcSMatt Macy } 57eda14cbcSMatt Macy 58eda14cbcSMatt Macy 59eda14cbcSMatt Macy /* 60eda14cbcSMatt Macy ** resizes the string table 61eda14cbcSMatt Macy */ 62eda14cbcSMatt Macy void luaS_resize (lua_State *L, int newsize) { 63eda14cbcSMatt Macy int i; 64eda14cbcSMatt Macy stringtable *tb = &G(L)->strt; 65eda14cbcSMatt Macy /* cannot resize while GC is traversing strings */ 66eda14cbcSMatt Macy luaC_runtilstate(L, ~bitmask(GCSsweepstring)); 67eda14cbcSMatt Macy if (newsize > tb->size) { 68eda14cbcSMatt Macy luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *); 69eda14cbcSMatt Macy for (i = tb->size; i < newsize; i++) tb->hash[i] = NULL; 70eda14cbcSMatt Macy } 71eda14cbcSMatt Macy /* rehash */ 72eda14cbcSMatt Macy for (i=0; i<tb->size; i++) { 73eda14cbcSMatt Macy GCObject *p = tb->hash[i]; 74eda14cbcSMatt Macy tb->hash[i] = NULL; 75eda14cbcSMatt Macy while (p) { /* for each node in the list */ 76eda14cbcSMatt Macy GCObject *next = gch(p)->next; /* save next */ 77eda14cbcSMatt Macy unsigned int h = lmod(gco2ts(p)->hash, newsize); /* new position */ 78eda14cbcSMatt Macy gch(p)->next = tb->hash[h]; /* chain it */ 79eda14cbcSMatt Macy tb->hash[h] = p; 80eda14cbcSMatt Macy resetoldbit(p); /* see MOVE OLD rule */ 81eda14cbcSMatt Macy p = next; 82eda14cbcSMatt Macy } 83eda14cbcSMatt Macy } 84eda14cbcSMatt Macy if (newsize < tb->size) { 85eda14cbcSMatt Macy /* shrinking slice must be empty */ 86eda14cbcSMatt Macy lua_assert(tb->hash[newsize] == NULL && tb->hash[tb->size - 1] == NULL); 87eda14cbcSMatt Macy luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *); 88eda14cbcSMatt Macy } 89eda14cbcSMatt Macy tb->size = newsize; 90eda14cbcSMatt Macy } 91eda14cbcSMatt Macy 92eda14cbcSMatt Macy 93eda14cbcSMatt Macy /* 94eda14cbcSMatt Macy ** creates a new string object 95eda14cbcSMatt Macy */ 96eda14cbcSMatt Macy static TString *createstrobj (lua_State *L, const char *str, size_t l, 97eda14cbcSMatt Macy int tag, unsigned int h, GCObject **list) { 98eda14cbcSMatt Macy TString *ts; 99eda14cbcSMatt Macy char *sbuf; 100eda14cbcSMatt Macy size_t totalsize; /* total size of TString object */ 101eda14cbcSMatt Macy totalsize = sizeof(TString) + ((l + 1) * sizeof(char)); 102eda14cbcSMatt Macy ts = &luaC_newobj(L, tag, totalsize, list, 0)->ts; 103eda14cbcSMatt Macy ts->tsv.len = l; 104eda14cbcSMatt Macy ts->tsv.hash = h; 105eda14cbcSMatt Macy ts->tsv.extra = 0; 106*7a7741afSMartin Matuska sbuf = ts->contents; 107eda14cbcSMatt Macy memcpy(sbuf, str, l*sizeof(char)); 108eda14cbcSMatt Macy sbuf[l] = '\0'; /* ending 0 */ 109eda14cbcSMatt Macy return ts; 110eda14cbcSMatt Macy } 111eda14cbcSMatt Macy 112eda14cbcSMatt Macy 113eda14cbcSMatt Macy /* 114eda14cbcSMatt Macy ** creates a new short string, inserting it into string table 115eda14cbcSMatt Macy */ 116eda14cbcSMatt Macy static TString *newshrstr (lua_State *L, const char *str, size_t l, 117eda14cbcSMatt Macy unsigned int h) { 118eda14cbcSMatt Macy GCObject **list; /* (pointer to) list where it will be inserted */ 119eda14cbcSMatt Macy stringtable *tb = &G(L)->strt; 120eda14cbcSMatt Macy TString *s; 121eda14cbcSMatt Macy if (tb->nuse >= cast(lu_int32, tb->size) && tb->size <= MAX_INT/2) 122eda14cbcSMatt Macy luaS_resize(L, tb->size*2); /* too crowded */ 123eda14cbcSMatt Macy list = &tb->hash[lmod(h, tb->size)]; 124eda14cbcSMatt Macy s = createstrobj(L, str, l, LUA_TSHRSTR, h, list); 125eda14cbcSMatt Macy tb->nuse++; 126eda14cbcSMatt Macy return s; 127eda14cbcSMatt Macy } 128eda14cbcSMatt Macy 129eda14cbcSMatt Macy 130eda14cbcSMatt Macy /* 131eda14cbcSMatt Macy ** checks whether short string exists and reuses it or creates a new one 132eda14cbcSMatt Macy */ 133eda14cbcSMatt Macy static TString *internshrstr (lua_State *L, const char *str, size_t l) { 134eda14cbcSMatt Macy GCObject *o; 135eda14cbcSMatt Macy global_State *g = G(L); 136eda14cbcSMatt Macy unsigned int h = luaS_hash(str, l, g->seed); 137eda14cbcSMatt Macy for (o = g->strt.hash[lmod(h, g->strt.size)]; 138eda14cbcSMatt Macy o != NULL; 139eda14cbcSMatt Macy o = gch(o)->next) { 140eda14cbcSMatt Macy TString *ts = rawgco2ts(o); 141eda14cbcSMatt Macy if (h == ts->tsv.hash && 142eda14cbcSMatt Macy l == ts->tsv.len && 143eda14cbcSMatt Macy (memcmp(str, getstr(ts), l * sizeof(char)) == 0)) { 144eda14cbcSMatt Macy if (isdead(G(L), o)) /* string is dead (but was not collected yet)? */ 145eda14cbcSMatt Macy changewhite(o); /* resurrect it */ 146eda14cbcSMatt Macy return ts; 147eda14cbcSMatt Macy } 148eda14cbcSMatt Macy } 149eda14cbcSMatt Macy return newshrstr(L, str, l, h); /* not found; create a new string */ 150eda14cbcSMatt Macy } 151eda14cbcSMatt Macy 152eda14cbcSMatt Macy 153eda14cbcSMatt Macy /* 154eda14cbcSMatt Macy ** new string (with explicit length) 155eda14cbcSMatt Macy */ 156eda14cbcSMatt Macy TString *luaS_newlstr (lua_State *L, const char *str, size_t l) { 157eda14cbcSMatt Macy if (l <= LUAI_MAXSHORTLEN) /* short string? */ 158eda14cbcSMatt Macy return internshrstr(L, str, l); 159eda14cbcSMatt Macy else { 160eda14cbcSMatt Macy if (l + 1 > (MAX_SIZET - sizeof(TString))/sizeof(char)) 161eda14cbcSMatt Macy luaM_toobig(L); 162eda14cbcSMatt Macy return createstrobj(L, str, l, LUA_TLNGSTR, G(L)->seed, NULL); 163eda14cbcSMatt Macy } 164eda14cbcSMatt Macy } 165eda14cbcSMatt Macy 166eda14cbcSMatt Macy 167eda14cbcSMatt Macy /* 168eda14cbcSMatt Macy ** new zero-terminated string 169eda14cbcSMatt Macy */ 170eda14cbcSMatt Macy TString *luaS_new (lua_State *L, const char *str) { 171eda14cbcSMatt Macy return luaS_newlstr(L, str, strlen(str)); 172eda14cbcSMatt Macy } 173eda14cbcSMatt Macy 174eda14cbcSMatt Macy 175eda14cbcSMatt Macy Udata *luaS_newudata (lua_State *L, size_t s, Table *e) { 176eda14cbcSMatt Macy Udata *u; 177eda14cbcSMatt Macy if (s > MAX_SIZET - sizeof(Udata)) 178eda14cbcSMatt Macy luaM_toobig(L); 179eda14cbcSMatt Macy u = &luaC_newobj(L, LUA_TUSERDATA, sizeof(Udata) + s, NULL, 0)->u; 180eda14cbcSMatt Macy u->uv.len = s; 181eda14cbcSMatt Macy u->uv.metatable = NULL; 182eda14cbcSMatt Macy u->uv.env = e; 183eda14cbcSMatt Macy return u; 184eda14cbcSMatt Macy } 185