xref: /freebsd/sys/contrib/openzfs/module/lua/lstring.c (revision 61145dc2b94f12f6a47344fb9aac702321880e43)
// SPDX-License-Identifier: MIT
/*
** $Id: lstring.c,v 2.26.1.1 2013/04/12 18:48:47 roberto Exp $
** String table (keeps all strings handled by Lua)
** See Copyright Notice in lua.h
*/
7eda14cbcSMatt Macy 
8eda14cbcSMatt Macy 
9eda14cbcSMatt Macy #define lstring_c
10eda14cbcSMatt Macy #define LUA_CORE
11eda14cbcSMatt Macy 
12eda14cbcSMatt Macy #include <sys/lua/lua.h>
13eda14cbcSMatt Macy 
14eda14cbcSMatt Macy #include "lmem.h"
15eda14cbcSMatt Macy #include "lobject.h"
16eda14cbcSMatt Macy #include "lstate.h"
17eda14cbcSMatt Macy #include "lstring.h"
18eda14cbcSMatt Macy 
19eda14cbcSMatt Macy 
/*
** Bounds the work done when hashing a string: luaS_hash derives its
** sampling step from (length >> LUAI_HASHLIMIT) + 1, so at most
** ~(2^LUAI_HASHLIMIT) bytes of a string take part in its hash.
** A definition supplied before this point takes precedence.
*/
#ifndef LUAI_HASHLIMIT
#define LUAI_HASHLIMIT		5
#endif
27eda14cbcSMatt Macy 
28eda14cbcSMatt Macy 
29eda14cbcSMatt Macy /*
30eda14cbcSMatt Macy ** equality for long strings
31eda14cbcSMatt Macy */
luaS_eqlngstr(TString * a,TString * b)32eda14cbcSMatt Macy int luaS_eqlngstr (TString *a, TString *b) {
33eda14cbcSMatt Macy   size_t len = a->tsv.len;
34eda14cbcSMatt Macy   lua_assert(a->tsv.tt == LUA_TLNGSTR && b->tsv.tt == LUA_TLNGSTR);
35eda14cbcSMatt Macy   return (a == b) ||  /* same instance or... */
36eda14cbcSMatt Macy     ((len == b->tsv.len) &&  /* equal length and ... */
37eda14cbcSMatt Macy      (memcmp(getstr(a), getstr(b), len) == 0));  /* equal contents */
38eda14cbcSMatt Macy }
39eda14cbcSMatt Macy 
40eda14cbcSMatt Macy 
41eda14cbcSMatt Macy /*
42eda14cbcSMatt Macy ** equality for strings
43eda14cbcSMatt Macy */
luaS_eqstr(TString * a,TString * b)44eda14cbcSMatt Macy int luaS_eqstr (TString *a, TString *b) {
45eda14cbcSMatt Macy   return (a->tsv.tt == b->tsv.tt) &&
46eda14cbcSMatt Macy          (a->tsv.tt == LUA_TSHRSTR ? eqshrstr(a, b) : luaS_eqlngstr(a, b));
47eda14cbcSMatt Macy }
48eda14cbcSMatt Macy 
49eda14cbcSMatt Macy 
luaS_hash(const char * str,size_t l,unsigned int seed)50eda14cbcSMatt Macy unsigned int luaS_hash (const char *str, size_t l, unsigned int seed) {
51eda14cbcSMatt Macy   unsigned int h = seed ^ cast(unsigned int, l);
52eda14cbcSMatt Macy   size_t l1;
53eda14cbcSMatt Macy   size_t step = (l >> LUAI_HASHLIMIT) + 1;
54eda14cbcSMatt Macy   for (l1 = l; l1 >= step; l1 -= step)
55eda14cbcSMatt Macy     h = h ^ ((h<<5) + (h>>2) + cast_byte(str[l1 - 1]));
56eda14cbcSMatt Macy   return h;
57eda14cbcSMatt Macy }
58eda14cbcSMatt Macy 
59eda14cbcSMatt Macy 
60eda14cbcSMatt Macy /*
61eda14cbcSMatt Macy ** resizes the string table
62eda14cbcSMatt Macy */
luaS_resize(lua_State * L,int newsize)63eda14cbcSMatt Macy void luaS_resize (lua_State *L, int newsize) {
64eda14cbcSMatt Macy   int i;
65eda14cbcSMatt Macy   stringtable *tb = &G(L)->strt;
66eda14cbcSMatt Macy   /* cannot resize while GC is traversing strings */
67eda14cbcSMatt Macy   luaC_runtilstate(L, ~bitmask(GCSsweepstring));
68eda14cbcSMatt Macy   if (newsize > tb->size) {
69eda14cbcSMatt Macy     luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *);
70eda14cbcSMatt Macy     for (i = tb->size; i < newsize; i++) tb->hash[i] = NULL;
71eda14cbcSMatt Macy   }
72eda14cbcSMatt Macy   /* rehash */
73eda14cbcSMatt Macy   for (i=0; i<tb->size; i++) {
74eda14cbcSMatt Macy     GCObject *p = tb->hash[i];
75eda14cbcSMatt Macy     tb->hash[i] = NULL;
76eda14cbcSMatt Macy     while (p) {  /* for each node in the list */
77eda14cbcSMatt Macy       GCObject *next = gch(p)->next;  /* save next */
78eda14cbcSMatt Macy       unsigned int h = lmod(gco2ts(p)->hash, newsize);  /* new position */
79eda14cbcSMatt Macy       gch(p)->next = tb->hash[h];  /* chain it */
80eda14cbcSMatt Macy       tb->hash[h] = p;
81eda14cbcSMatt Macy       resetoldbit(p);  /* see MOVE OLD rule */
82eda14cbcSMatt Macy       p = next;
83eda14cbcSMatt Macy     }
84eda14cbcSMatt Macy   }
85eda14cbcSMatt Macy   if (newsize < tb->size) {
86eda14cbcSMatt Macy     /* shrinking slice must be empty */
87eda14cbcSMatt Macy     lua_assert(tb->hash[newsize] == NULL && tb->hash[tb->size - 1] == NULL);
88eda14cbcSMatt Macy     luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *);
89eda14cbcSMatt Macy   }
90eda14cbcSMatt Macy   tb->size = newsize;
91eda14cbcSMatt Macy }
92eda14cbcSMatt Macy 
93eda14cbcSMatt Macy 
94eda14cbcSMatt Macy /*
95eda14cbcSMatt Macy ** creates a new string object
96eda14cbcSMatt Macy */
createstrobj(lua_State * L,const char * str,size_t l,int tag,unsigned int h,GCObject ** list)97eda14cbcSMatt Macy static TString *createstrobj (lua_State *L, const char *str, size_t l,
98eda14cbcSMatt Macy                               int tag, unsigned int h, GCObject **list) {
99eda14cbcSMatt Macy   TString *ts;
100eda14cbcSMatt Macy   char *sbuf;
101eda14cbcSMatt Macy   size_t totalsize;  /* total size of TString object */
102eda14cbcSMatt Macy   totalsize = sizeof(TString) + ((l + 1) * sizeof(char));
103eda14cbcSMatt Macy   ts = &luaC_newobj(L, tag, totalsize, list, 0)->ts;
104eda14cbcSMatt Macy   ts->tsv.len = l;
105eda14cbcSMatt Macy   ts->tsv.hash = h;
106eda14cbcSMatt Macy   ts->tsv.extra = 0;
1077a7741afSMartin Matuska   sbuf = ts->contents;
108eda14cbcSMatt Macy   memcpy(sbuf, str, l*sizeof(char));
109eda14cbcSMatt Macy   sbuf[l] = '\0';  /* ending 0 */
110eda14cbcSMatt Macy   return ts;
111eda14cbcSMatt Macy }
112eda14cbcSMatt Macy 
113eda14cbcSMatt Macy 
114eda14cbcSMatt Macy /*
115eda14cbcSMatt Macy ** creates a new short string, inserting it into string table
116eda14cbcSMatt Macy */
newshrstr(lua_State * L,const char * str,size_t l,unsigned int h)117eda14cbcSMatt Macy static TString *newshrstr (lua_State *L, const char *str, size_t l,
118eda14cbcSMatt Macy                                        unsigned int h) {
119eda14cbcSMatt Macy   GCObject **list;  /* (pointer to) list where it will be inserted */
120eda14cbcSMatt Macy   stringtable *tb = &G(L)->strt;
121eda14cbcSMatt Macy   TString *s;
122eda14cbcSMatt Macy   if (tb->nuse >= cast(lu_int32, tb->size) && tb->size <= MAX_INT/2)
123eda14cbcSMatt Macy     luaS_resize(L, tb->size*2);  /* too crowded */
124eda14cbcSMatt Macy   list = &tb->hash[lmod(h, tb->size)];
125eda14cbcSMatt Macy   s = createstrobj(L, str, l, LUA_TSHRSTR, h, list);
126eda14cbcSMatt Macy   tb->nuse++;
127eda14cbcSMatt Macy   return s;
128eda14cbcSMatt Macy }
129eda14cbcSMatt Macy 
130eda14cbcSMatt Macy 
131eda14cbcSMatt Macy /*
132eda14cbcSMatt Macy ** checks whether short string exists and reuses it or creates a new one
133eda14cbcSMatt Macy */
internshrstr(lua_State * L,const char * str,size_t l)134eda14cbcSMatt Macy static TString *internshrstr (lua_State *L, const char *str, size_t l) {
135eda14cbcSMatt Macy   GCObject *o;
136eda14cbcSMatt Macy   global_State *g = G(L);
137eda14cbcSMatt Macy   unsigned int h = luaS_hash(str, l, g->seed);
138eda14cbcSMatt Macy   for (o = g->strt.hash[lmod(h, g->strt.size)];
139eda14cbcSMatt Macy        o != NULL;
140eda14cbcSMatt Macy        o = gch(o)->next) {
141eda14cbcSMatt Macy     TString *ts = rawgco2ts(o);
142eda14cbcSMatt Macy     if (h == ts->tsv.hash &&
143eda14cbcSMatt Macy         l == ts->tsv.len &&
144eda14cbcSMatt Macy         (memcmp(str, getstr(ts), l * sizeof(char)) == 0)) {
145eda14cbcSMatt Macy       if (isdead(G(L), o))  /* string is dead (but was not collected yet)? */
146eda14cbcSMatt Macy         changewhite(o);  /* resurrect it */
147eda14cbcSMatt Macy       return ts;
148eda14cbcSMatt Macy     }
149eda14cbcSMatt Macy   }
150eda14cbcSMatt Macy   return newshrstr(L, str, l, h);  /* not found; create a new string */
151eda14cbcSMatt Macy }
152eda14cbcSMatt Macy 
153eda14cbcSMatt Macy 
154eda14cbcSMatt Macy /*
155eda14cbcSMatt Macy ** new string (with explicit length)
156eda14cbcSMatt Macy */
luaS_newlstr(lua_State * L,const char * str,size_t l)157eda14cbcSMatt Macy TString *luaS_newlstr (lua_State *L, const char *str, size_t l) {
158eda14cbcSMatt Macy   if (l <= LUAI_MAXSHORTLEN)  /* short string? */
159eda14cbcSMatt Macy     return internshrstr(L, str, l);
160eda14cbcSMatt Macy   else {
161eda14cbcSMatt Macy     if (l + 1 > (MAX_SIZET - sizeof(TString))/sizeof(char))
162eda14cbcSMatt Macy       luaM_toobig(L);
163eda14cbcSMatt Macy     return createstrobj(L, str, l, LUA_TLNGSTR, G(L)->seed, NULL);
164eda14cbcSMatt Macy   }
165eda14cbcSMatt Macy }
166eda14cbcSMatt Macy 
167eda14cbcSMatt Macy 
168eda14cbcSMatt Macy /*
169eda14cbcSMatt Macy ** new zero-terminated string
170eda14cbcSMatt Macy */
luaS_new(lua_State * L,const char * str)171eda14cbcSMatt Macy TString *luaS_new (lua_State *L, const char *str) {
172eda14cbcSMatt Macy   return luaS_newlstr(L, str, strlen(str));
173eda14cbcSMatt Macy }
174eda14cbcSMatt Macy 
175eda14cbcSMatt Macy 
luaS_newudata(lua_State * L,size_t s,Table * e)176eda14cbcSMatt Macy Udata *luaS_newudata (lua_State *L, size_t s, Table *e) {
177eda14cbcSMatt Macy   Udata *u;
178eda14cbcSMatt Macy   if (s > MAX_SIZET - sizeof(Udata))
179eda14cbcSMatt Macy     luaM_toobig(L);
180eda14cbcSMatt Macy   u = &luaC_newobj(L, LUA_TUSERDATA, sizeof(Udata) + s, NULL, 0)->u;
181eda14cbcSMatt Macy   u->uv.len = s;
182eda14cbcSMatt Macy   u->uv.metatable = NULL;
183eda14cbcSMatt Macy   u->uv.env = e;
184eda14cbcSMatt Macy   return u;
185eda14cbcSMatt Macy }
186