1*61145dc2SMartin Matuska // SPDX-License-Identifier: MIT
2eda14cbcSMatt Macy /*
3eda14cbcSMatt Macy ** $Id: lstring.c,v 2.26.1.1 2013/04/12 18:48:47 roberto Exp $
4eda14cbcSMatt Macy ** String table (keeps all strings handled by Lua)
5eda14cbcSMatt Macy ** See Copyright Notice in lua.h
6eda14cbcSMatt Macy */
7eda14cbcSMatt Macy
8eda14cbcSMatt Macy
9eda14cbcSMatt Macy #define lstring_c
10eda14cbcSMatt Macy #define LUA_CORE
11eda14cbcSMatt Macy
12eda14cbcSMatt Macy #include <sys/lua/lua.h>
13eda14cbcSMatt Macy
14eda14cbcSMatt Macy #include "lmem.h"
15eda14cbcSMatt Macy #include "lobject.h"
16eda14cbcSMatt Macy #include "lstate.h"
17eda14cbcSMatt Macy #include "lstring.h"
18eda14cbcSMatt Macy
19eda14cbcSMatt Macy
/*
** Bound, expressed as a power of two, on how many bytes of a string
** take part in its hash: luaS_hash samples at most about
** 2^LUAI_HASHLIMIT bytes. A definition made before this point wins.
*/
#ifndef LUAI_HASHLIMIT
#define LUAI_HASHLIMIT		5
#endif
27eda14cbcSMatt Macy
28eda14cbcSMatt Macy
29eda14cbcSMatt Macy /*
30eda14cbcSMatt Macy ** equality for long strings
31eda14cbcSMatt Macy */
luaS_eqlngstr(TString * a,TString * b)32eda14cbcSMatt Macy int luaS_eqlngstr (TString *a, TString *b) {
33eda14cbcSMatt Macy size_t len = a->tsv.len;
34eda14cbcSMatt Macy lua_assert(a->tsv.tt == LUA_TLNGSTR && b->tsv.tt == LUA_TLNGSTR);
35eda14cbcSMatt Macy return (a == b) || /* same instance or... */
36eda14cbcSMatt Macy ((len == b->tsv.len) && /* equal length and ... */
37eda14cbcSMatt Macy (memcmp(getstr(a), getstr(b), len) == 0)); /* equal contents */
38eda14cbcSMatt Macy }
39eda14cbcSMatt Macy
40eda14cbcSMatt Macy
41eda14cbcSMatt Macy /*
42eda14cbcSMatt Macy ** equality for strings
43eda14cbcSMatt Macy */
luaS_eqstr(TString * a,TString * b)44eda14cbcSMatt Macy int luaS_eqstr (TString *a, TString *b) {
45eda14cbcSMatt Macy return (a->tsv.tt == b->tsv.tt) &&
46eda14cbcSMatt Macy (a->tsv.tt == LUA_TSHRSTR ? eqshrstr(a, b) : luaS_eqlngstr(a, b));
47eda14cbcSMatt Macy }
48eda14cbcSMatt Macy
49eda14cbcSMatt Macy
luaS_hash(const char * str,size_t l,unsigned int seed)50eda14cbcSMatt Macy unsigned int luaS_hash (const char *str, size_t l, unsigned int seed) {
51eda14cbcSMatt Macy unsigned int h = seed ^ cast(unsigned int, l);
52eda14cbcSMatt Macy size_t l1;
53eda14cbcSMatt Macy size_t step = (l >> LUAI_HASHLIMIT) + 1;
54eda14cbcSMatt Macy for (l1 = l; l1 >= step; l1 -= step)
55eda14cbcSMatt Macy h = h ^ ((h<<5) + (h>>2) + cast_byte(str[l1 - 1]));
56eda14cbcSMatt Macy return h;
57eda14cbcSMatt Macy }
58eda14cbcSMatt Macy
59eda14cbcSMatt Macy
60eda14cbcSMatt Macy /*
61eda14cbcSMatt Macy ** resizes the string table
62eda14cbcSMatt Macy */
luaS_resize(lua_State * L,int newsize)63eda14cbcSMatt Macy void luaS_resize (lua_State *L, int newsize) {
64eda14cbcSMatt Macy int i;
65eda14cbcSMatt Macy stringtable *tb = &G(L)->strt;
66eda14cbcSMatt Macy /* cannot resize while GC is traversing strings */
67eda14cbcSMatt Macy luaC_runtilstate(L, ~bitmask(GCSsweepstring));
68eda14cbcSMatt Macy if (newsize > tb->size) {
69eda14cbcSMatt Macy luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *);
70eda14cbcSMatt Macy for (i = tb->size; i < newsize; i++) tb->hash[i] = NULL;
71eda14cbcSMatt Macy }
72eda14cbcSMatt Macy /* rehash */
73eda14cbcSMatt Macy for (i=0; i<tb->size; i++) {
74eda14cbcSMatt Macy GCObject *p = tb->hash[i];
75eda14cbcSMatt Macy tb->hash[i] = NULL;
76eda14cbcSMatt Macy while (p) { /* for each node in the list */
77eda14cbcSMatt Macy GCObject *next = gch(p)->next; /* save next */
78eda14cbcSMatt Macy unsigned int h = lmod(gco2ts(p)->hash, newsize); /* new position */
79eda14cbcSMatt Macy gch(p)->next = tb->hash[h]; /* chain it */
80eda14cbcSMatt Macy tb->hash[h] = p;
81eda14cbcSMatt Macy resetoldbit(p); /* see MOVE OLD rule */
82eda14cbcSMatt Macy p = next;
83eda14cbcSMatt Macy }
84eda14cbcSMatt Macy }
85eda14cbcSMatt Macy if (newsize < tb->size) {
86eda14cbcSMatt Macy /* shrinking slice must be empty */
87eda14cbcSMatt Macy lua_assert(tb->hash[newsize] == NULL && tb->hash[tb->size - 1] == NULL);
88eda14cbcSMatt Macy luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *);
89eda14cbcSMatt Macy }
90eda14cbcSMatt Macy tb->size = newsize;
91eda14cbcSMatt Macy }
92eda14cbcSMatt Macy
93eda14cbcSMatt Macy
94eda14cbcSMatt Macy /*
95eda14cbcSMatt Macy ** creates a new string object
96eda14cbcSMatt Macy */
createstrobj(lua_State * L,const char * str,size_t l,int tag,unsigned int h,GCObject ** list)97eda14cbcSMatt Macy static TString *createstrobj (lua_State *L, const char *str, size_t l,
98eda14cbcSMatt Macy int tag, unsigned int h, GCObject **list) {
99eda14cbcSMatt Macy TString *ts;
100eda14cbcSMatt Macy char *sbuf;
101eda14cbcSMatt Macy size_t totalsize; /* total size of TString object */
102eda14cbcSMatt Macy totalsize = sizeof(TString) + ((l + 1) * sizeof(char));
103eda14cbcSMatt Macy ts = &luaC_newobj(L, tag, totalsize, list, 0)->ts;
104eda14cbcSMatt Macy ts->tsv.len = l;
105eda14cbcSMatt Macy ts->tsv.hash = h;
106eda14cbcSMatt Macy ts->tsv.extra = 0;
1077a7741afSMartin Matuska sbuf = ts->contents;
108eda14cbcSMatt Macy memcpy(sbuf, str, l*sizeof(char));
109eda14cbcSMatt Macy sbuf[l] = '\0'; /* ending 0 */
110eda14cbcSMatt Macy return ts;
111eda14cbcSMatt Macy }
112eda14cbcSMatt Macy
113eda14cbcSMatt Macy
114eda14cbcSMatt Macy /*
115eda14cbcSMatt Macy ** creates a new short string, inserting it into string table
116eda14cbcSMatt Macy */
newshrstr(lua_State * L,const char * str,size_t l,unsigned int h)117eda14cbcSMatt Macy static TString *newshrstr (lua_State *L, const char *str, size_t l,
118eda14cbcSMatt Macy unsigned int h) {
119eda14cbcSMatt Macy GCObject **list; /* (pointer to) list where it will be inserted */
120eda14cbcSMatt Macy stringtable *tb = &G(L)->strt;
121eda14cbcSMatt Macy TString *s;
122eda14cbcSMatt Macy if (tb->nuse >= cast(lu_int32, tb->size) && tb->size <= MAX_INT/2)
123eda14cbcSMatt Macy luaS_resize(L, tb->size*2); /* too crowded */
124eda14cbcSMatt Macy list = &tb->hash[lmod(h, tb->size)];
125eda14cbcSMatt Macy s = createstrobj(L, str, l, LUA_TSHRSTR, h, list);
126eda14cbcSMatt Macy tb->nuse++;
127eda14cbcSMatt Macy return s;
128eda14cbcSMatt Macy }
129eda14cbcSMatt Macy
130eda14cbcSMatt Macy
131eda14cbcSMatt Macy /*
132eda14cbcSMatt Macy ** checks whether short string exists and reuses it or creates a new one
133eda14cbcSMatt Macy */
internshrstr(lua_State * L,const char * str,size_t l)134eda14cbcSMatt Macy static TString *internshrstr (lua_State *L, const char *str, size_t l) {
135eda14cbcSMatt Macy GCObject *o;
136eda14cbcSMatt Macy global_State *g = G(L);
137eda14cbcSMatt Macy unsigned int h = luaS_hash(str, l, g->seed);
138eda14cbcSMatt Macy for (o = g->strt.hash[lmod(h, g->strt.size)];
139eda14cbcSMatt Macy o != NULL;
140eda14cbcSMatt Macy o = gch(o)->next) {
141eda14cbcSMatt Macy TString *ts = rawgco2ts(o);
142eda14cbcSMatt Macy if (h == ts->tsv.hash &&
143eda14cbcSMatt Macy l == ts->tsv.len &&
144eda14cbcSMatt Macy (memcmp(str, getstr(ts), l * sizeof(char)) == 0)) {
145eda14cbcSMatt Macy if (isdead(G(L), o)) /* string is dead (but was not collected yet)? */
146eda14cbcSMatt Macy changewhite(o); /* resurrect it */
147eda14cbcSMatt Macy return ts;
148eda14cbcSMatt Macy }
149eda14cbcSMatt Macy }
150eda14cbcSMatt Macy return newshrstr(L, str, l, h); /* not found; create a new string */
151eda14cbcSMatt Macy }
152eda14cbcSMatt Macy
153eda14cbcSMatt Macy
154eda14cbcSMatt Macy /*
155eda14cbcSMatt Macy ** new string (with explicit length)
156eda14cbcSMatt Macy */
luaS_newlstr(lua_State * L,const char * str,size_t l)157eda14cbcSMatt Macy TString *luaS_newlstr (lua_State *L, const char *str, size_t l) {
158eda14cbcSMatt Macy if (l <= LUAI_MAXSHORTLEN) /* short string? */
159eda14cbcSMatt Macy return internshrstr(L, str, l);
160eda14cbcSMatt Macy else {
161eda14cbcSMatt Macy if (l + 1 > (MAX_SIZET - sizeof(TString))/sizeof(char))
162eda14cbcSMatt Macy luaM_toobig(L);
163eda14cbcSMatt Macy return createstrobj(L, str, l, LUA_TLNGSTR, G(L)->seed, NULL);
164eda14cbcSMatt Macy }
165eda14cbcSMatt Macy }
166eda14cbcSMatt Macy
167eda14cbcSMatt Macy
168eda14cbcSMatt Macy /*
169eda14cbcSMatt Macy ** new zero-terminated string
170eda14cbcSMatt Macy */
luaS_new(lua_State * L,const char * str)171eda14cbcSMatt Macy TString *luaS_new (lua_State *L, const char *str) {
172eda14cbcSMatt Macy return luaS_newlstr(L, str, strlen(str));
173eda14cbcSMatt Macy }
174eda14cbcSMatt Macy
175eda14cbcSMatt Macy
luaS_newudata(lua_State * L,size_t s,Table * e)176eda14cbcSMatt Macy Udata *luaS_newudata (lua_State *L, size_t s, Table *e) {
177eda14cbcSMatt Macy Udata *u;
178eda14cbcSMatt Macy if (s > MAX_SIZET - sizeof(Udata))
179eda14cbcSMatt Macy luaM_toobig(L);
180eda14cbcSMatt Macy u = &luaC_newobj(L, LUA_TUSERDATA, sizeof(Udata) + s, NULL, 0)->u;
181eda14cbcSMatt Macy u->uv.len = s;
182eda14cbcSMatt Macy u->uv.metatable = NULL;
183eda14cbcSMatt Macy u->uv.env = e;
184eda14cbcSMatt Macy return u;
185eda14cbcSMatt Macy }
186