xref: /freebsd/sys/contrib/openzfs/module/lua/lstring.c (revision 7a7741af18d6c8a804cc643cb7ecda9d730c6aa6)
1eda14cbcSMatt Macy /*
2eda14cbcSMatt Macy ** $Id: lstring.c,v 2.26.1.1 2013/04/12 18:48:47 roberto Exp $
3eda14cbcSMatt Macy ** String table (keeps all strings handled by Lua)
4eda14cbcSMatt Macy ** See Copyright Notice in lua.h
5eda14cbcSMatt Macy */
6eda14cbcSMatt Macy 
7eda14cbcSMatt Macy 
8eda14cbcSMatt Macy #define lstring_c
9eda14cbcSMatt Macy #define LUA_CORE
10eda14cbcSMatt Macy 
11eda14cbcSMatt Macy #include <sys/lua/lua.h>
12eda14cbcSMatt Macy 
13eda14cbcSMatt Macy #include "lmem.h"
14eda14cbcSMatt Macy #include "lobject.h"
15eda14cbcSMatt Macy #include "lstate.h"
16eda14cbcSMatt Macy #include "lstring.h"
17eda14cbcSMatt Macy 
18eda14cbcSMatt Macy 
/*
** Default for LUAI_HASHLIMIT, used only when the build has not already
** provided a value. The string hash inspects roughly 2^LUAI_HASHLIMIT
** bytes of a string at most (see luaS_hash).
*/
#ifndef LUAI_HASHLIMIT
#define LUAI_HASHLIMIT		5
#endif
26eda14cbcSMatt Macy 
27eda14cbcSMatt Macy 
28eda14cbcSMatt Macy /*
29eda14cbcSMatt Macy ** equality for long strings
30eda14cbcSMatt Macy */
31eda14cbcSMatt Macy int luaS_eqlngstr (TString *a, TString *b) {
32eda14cbcSMatt Macy   size_t len = a->tsv.len;
33eda14cbcSMatt Macy   lua_assert(a->tsv.tt == LUA_TLNGSTR && b->tsv.tt == LUA_TLNGSTR);
34eda14cbcSMatt Macy   return (a == b) ||  /* same instance or... */
35eda14cbcSMatt Macy     ((len == b->tsv.len) &&  /* equal length and ... */
36eda14cbcSMatt Macy      (memcmp(getstr(a), getstr(b), len) == 0));  /* equal contents */
37eda14cbcSMatt Macy }
38eda14cbcSMatt Macy 
39eda14cbcSMatt Macy 
40eda14cbcSMatt Macy /*
41eda14cbcSMatt Macy ** equality for strings
42eda14cbcSMatt Macy */
43eda14cbcSMatt Macy int luaS_eqstr (TString *a, TString *b) {
44eda14cbcSMatt Macy   return (a->tsv.tt == b->tsv.tt) &&
45eda14cbcSMatt Macy          (a->tsv.tt == LUA_TSHRSTR ? eqshrstr(a, b) : luaS_eqlngstr(a, b));
46eda14cbcSMatt Macy }
47eda14cbcSMatt Macy 
48eda14cbcSMatt Macy 
49eda14cbcSMatt Macy unsigned int luaS_hash (const char *str, size_t l, unsigned int seed) {
50eda14cbcSMatt Macy   unsigned int h = seed ^ cast(unsigned int, l);
51eda14cbcSMatt Macy   size_t l1;
52eda14cbcSMatt Macy   size_t step = (l >> LUAI_HASHLIMIT) + 1;
53eda14cbcSMatt Macy   for (l1 = l; l1 >= step; l1 -= step)
54eda14cbcSMatt Macy     h = h ^ ((h<<5) + (h>>2) + cast_byte(str[l1 - 1]));
55eda14cbcSMatt Macy   return h;
56eda14cbcSMatt Macy }
57eda14cbcSMatt Macy 
58eda14cbcSMatt Macy 
59eda14cbcSMatt Macy /*
60eda14cbcSMatt Macy ** resizes the string table
61eda14cbcSMatt Macy */
62eda14cbcSMatt Macy void luaS_resize (lua_State *L, int newsize) {
63eda14cbcSMatt Macy   int i;
64eda14cbcSMatt Macy   stringtable *tb = &G(L)->strt;
65eda14cbcSMatt Macy   /* cannot resize while GC is traversing strings */
66eda14cbcSMatt Macy   luaC_runtilstate(L, ~bitmask(GCSsweepstring));
67eda14cbcSMatt Macy   if (newsize > tb->size) {
68eda14cbcSMatt Macy     luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *);
69eda14cbcSMatt Macy     for (i = tb->size; i < newsize; i++) tb->hash[i] = NULL;
70eda14cbcSMatt Macy   }
71eda14cbcSMatt Macy   /* rehash */
72eda14cbcSMatt Macy   for (i=0; i<tb->size; i++) {
73eda14cbcSMatt Macy     GCObject *p = tb->hash[i];
74eda14cbcSMatt Macy     tb->hash[i] = NULL;
75eda14cbcSMatt Macy     while (p) {  /* for each node in the list */
76eda14cbcSMatt Macy       GCObject *next = gch(p)->next;  /* save next */
77eda14cbcSMatt Macy       unsigned int h = lmod(gco2ts(p)->hash, newsize);  /* new position */
78eda14cbcSMatt Macy       gch(p)->next = tb->hash[h];  /* chain it */
79eda14cbcSMatt Macy       tb->hash[h] = p;
80eda14cbcSMatt Macy       resetoldbit(p);  /* see MOVE OLD rule */
81eda14cbcSMatt Macy       p = next;
82eda14cbcSMatt Macy     }
83eda14cbcSMatt Macy   }
84eda14cbcSMatt Macy   if (newsize < tb->size) {
85eda14cbcSMatt Macy     /* shrinking slice must be empty */
86eda14cbcSMatt Macy     lua_assert(tb->hash[newsize] == NULL && tb->hash[tb->size - 1] == NULL);
87eda14cbcSMatt Macy     luaM_reallocvector(L, tb->hash, tb->size, newsize, GCObject *);
88eda14cbcSMatt Macy   }
89eda14cbcSMatt Macy   tb->size = newsize;
90eda14cbcSMatt Macy }
91eda14cbcSMatt Macy 
92eda14cbcSMatt Macy 
93eda14cbcSMatt Macy /*
94eda14cbcSMatt Macy ** creates a new string object
95eda14cbcSMatt Macy */
96eda14cbcSMatt Macy static TString *createstrobj (lua_State *L, const char *str, size_t l,
97eda14cbcSMatt Macy                               int tag, unsigned int h, GCObject **list) {
98eda14cbcSMatt Macy   TString *ts;
99eda14cbcSMatt Macy   char *sbuf;
100eda14cbcSMatt Macy   size_t totalsize;  /* total size of TString object */
101eda14cbcSMatt Macy   totalsize = sizeof(TString) + ((l + 1) * sizeof(char));
102eda14cbcSMatt Macy   ts = &luaC_newobj(L, tag, totalsize, list, 0)->ts;
103eda14cbcSMatt Macy   ts->tsv.len = l;
104eda14cbcSMatt Macy   ts->tsv.hash = h;
105eda14cbcSMatt Macy   ts->tsv.extra = 0;
106*7a7741afSMartin Matuska   sbuf = ts->contents;
107eda14cbcSMatt Macy   memcpy(sbuf, str, l*sizeof(char));
108eda14cbcSMatt Macy   sbuf[l] = '\0';  /* ending 0 */
109eda14cbcSMatt Macy   return ts;
110eda14cbcSMatt Macy }
111eda14cbcSMatt Macy 
112eda14cbcSMatt Macy 
113eda14cbcSMatt Macy /*
114eda14cbcSMatt Macy ** creates a new short string, inserting it into string table
115eda14cbcSMatt Macy */
116eda14cbcSMatt Macy static TString *newshrstr (lua_State *L, const char *str, size_t l,
117eda14cbcSMatt Macy                                        unsigned int h) {
118eda14cbcSMatt Macy   GCObject **list;  /* (pointer to) list where it will be inserted */
119eda14cbcSMatt Macy   stringtable *tb = &G(L)->strt;
120eda14cbcSMatt Macy   TString *s;
121eda14cbcSMatt Macy   if (tb->nuse >= cast(lu_int32, tb->size) && tb->size <= MAX_INT/2)
122eda14cbcSMatt Macy     luaS_resize(L, tb->size*2);  /* too crowded */
123eda14cbcSMatt Macy   list = &tb->hash[lmod(h, tb->size)];
124eda14cbcSMatt Macy   s = createstrobj(L, str, l, LUA_TSHRSTR, h, list);
125eda14cbcSMatt Macy   tb->nuse++;
126eda14cbcSMatt Macy   return s;
127eda14cbcSMatt Macy }
128eda14cbcSMatt Macy 
129eda14cbcSMatt Macy 
130eda14cbcSMatt Macy /*
131eda14cbcSMatt Macy ** checks whether short string exists and reuses it or creates a new one
132eda14cbcSMatt Macy */
133eda14cbcSMatt Macy static TString *internshrstr (lua_State *L, const char *str, size_t l) {
134eda14cbcSMatt Macy   GCObject *o;
135eda14cbcSMatt Macy   global_State *g = G(L);
136eda14cbcSMatt Macy   unsigned int h = luaS_hash(str, l, g->seed);
137eda14cbcSMatt Macy   for (o = g->strt.hash[lmod(h, g->strt.size)];
138eda14cbcSMatt Macy        o != NULL;
139eda14cbcSMatt Macy        o = gch(o)->next) {
140eda14cbcSMatt Macy     TString *ts = rawgco2ts(o);
141eda14cbcSMatt Macy     if (h == ts->tsv.hash &&
142eda14cbcSMatt Macy         l == ts->tsv.len &&
143eda14cbcSMatt Macy         (memcmp(str, getstr(ts), l * sizeof(char)) == 0)) {
144eda14cbcSMatt Macy       if (isdead(G(L), o))  /* string is dead (but was not collected yet)? */
145eda14cbcSMatt Macy         changewhite(o);  /* resurrect it */
146eda14cbcSMatt Macy       return ts;
147eda14cbcSMatt Macy     }
148eda14cbcSMatt Macy   }
149eda14cbcSMatt Macy   return newshrstr(L, str, l, h);  /* not found; create a new string */
150eda14cbcSMatt Macy }
151eda14cbcSMatt Macy 
152eda14cbcSMatt Macy 
153eda14cbcSMatt Macy /*
154eda14cbcSMatt Macy ** new string (with explicit length)
155eda14cbcSMatt Macy */
156eda14cbcSMatt Macy TString *luaS_newlstr (lua_State *L, const char *str, size_t l) {
157eda14cbcSMatt Macy   if (l <= LUAI_MAXSHORTLEN)  /* short string? */
158eda14cbcSMatt Macy     return internshrstr(L, str, l);
159eda14cbcSMatt Macy   else {
160eda14cbcSMatt Macy     if (l + 1 > (MAX_SIZET - sizeof(TString))/sizeof(char))
161eda14cbcSMatt Macy       luaM_toobig(L);
162eda14cbcSMatt Macy     return createstrobj(L, str, l, LUA_TLNGSTR, G(L)->seed, NULL);
163eda14cbcSMatt Macy   }
164eda14cbcSMatt Macy }
165eda14cbcSMatt Macy 
166eda14cbcSMatt Macy 
167eda14cbcSMatt Macy /*
168eda14cbcSMatt Macy ** new zero-terminated string
169eda14cbcSMatt Macy */
170eda14cbcSMatt Macy TString *luaS_new (lua_State *L, const char *str) {
171eda14cbcSMatt Macy   return luaS_newlstr(L, str, strlen(str));
172eda14cbcSMatt Macy }
173eda14cbcSMatt Macy 
174eda14cbcSMatt Macy 
175eda14cbcSMatt Macy Udata *luaS_newudata (lua_State *L, size_t s, Table *e) {
176eda14cbcSMatt Macy   Udata *u;
177eda14cbcSMatt Macy   if (s > MAX_SIZET - sizeof(Udata))
178eda14cbcSMatt Macy     luaM_toobig(L);
179eda14cbcSMatt Macy   u = &luaC_newobj(L, LUA_TUSERDATA, sizeof(Udata) + s, NULL, 0)->u;
180eda14cbcSMatt Macy   u->uv.len = s;
181eda14cbcSMatt Macy   u->uv.metatable = NULL;
182eda14cbcSMatt Macy   u->uv.env = e;
183eda14cbcSMatt Macy   return u;
184eda14cbcSMatt Macy }
185