Skip to content

Commit 8de4d97

Browse files
committed
Implement string reference counting in cnex
1 parent bf5bb08 commit 8de4d97

File tree

5 files changed

+123
-29
lines changed

5 files changed

+123
-29
lines changed

exec/cnex/cell.c

+19-3
Original file line numberDiff line numberDiff line change
@@ -229,7 +229,8 @@ Cell *cell_fromCell(const Cell *c)
229229
x->other = NULL;
230230
break;
231231
case cBytes:
232-
x->string = string_copyString(c->string);
232+
x->string = c->string;
233+
x->string->refcount++;
233234
x->boolean = FALSE;
234235
x->number = number_from_uint32(0);
235236
x->object = NULL;
@@ -270,7 +271,8 @@ Cell *cell_fromCell(const Cell *c)
270271
x->other = NULL;
271272
break;
272273
case cString:
273-
x->string = string_copyString(c->string);
274+
x->string = c->string;
275+
x->string->refcount++;
274276
x->address = NULL;
275277
x->number = number_from_uint32(0);
276278
x->object = NULL;
@@ -332,6 +334,16 @@ Cell *cell_fromCellValue(const Cell* c)
332334
x->array = NULL;
333335
x->other = NULL;
334336
break;
337+
case cString:
338+
x->string = string_copyString(c->string);
339+
x->address = NULL;
340+
x->number = number_from_uint32(0);
341+
x->object = NULL;
342+
x->boolean = FALSE;
343+
x->array = NULL;
344+
x->dictionary = NULL;
345+
x->other = NULL;
346+
break;
335347
default:
336348
cell_copyCell(x, c);
337349
break;
@@ -618,6 +630,9 @@ void cell_valueCopyCell(Cell *dest, const Cell *source)
618630
case cDictionary:
619631
dest->dictionary = dictionary_copyDictionary(source->dictionary);
620632
break;
633+
case cString:
634+
dest->string = string_copyString(source->string);
635+
break;
621636
default:
622637
cell_copyCell(dest, source);
623638
break;
@@ -634,7 +649,8 @@ void cell_copyCell(Cell *dest, const Cell *source)
634649
dest->number = source->number;
635650
// ToDo: Split strings and bytes into separate entities; once we implement actual UTF8 strings.
636651
if ((source->type == cString || source->type == cBytes) && source->string != NULL) {
637-
dest->string = string_copyString(source->string);
652+
dest->string = source->string;
653+
dest->string->refcount++;
638654
} else {
639655
dest->string = NULL;
640656
}

exec/cnex/cnex.c

+1-1
Original file line numberDiff line numberDiff line change
@@ -823,7 +823,7 @@ void exec_STORES(TExecutor *self)
823823
{
824824
self->ip++;
825825
Cell *addr = top(self->stack)->address; pop(self->stack);
826-
cell_copyCell(addr, top(self->stack)); pop(self->stack);
826+
cell_valueCopyCell(addr, top(self->stack)); pop(self->stack);
827827
}
828828

829829
void exec_STOREY(TExecutor *self)

exec/cnex/global.c

+2-2
Original file line numberDiff line numberDiff line change
@@ -1537,7 +1537,7 @@ void pointer__toString(TExecutor *exec)
15371537

15381538
void string__append(TExecutor *exec)
15391539
{
1540-
Cell *b = cell_fromCell(top(exec->stack)); pop(exec->stack);
1540+
Cell *b = cell_fromCellValue(top(exec->stack)); pop(exec->stack);
15411541
Cell *addr = top(exec->stack)->address; pop(exec->stack);
15421542

15431543
addr->string->data = realloc(addr->string->data, addr->string->length + b->string->length);
@@ -1581,7 +1581,7 @@ void string__toString(TExecutor *exec)
15811581
void string__index(TExecutor *exec)
15821582
{
15831583
Number index = top(exec->stack)->number; pop(exec->stack);
1584-
Cell *a = cell_fromCell(top(exec->stack)); pop(exec->stack);
1584+
Cell *a = cell_fromCellValue(top(exec->stack)); pop(exec->stack);
15851585

15861586
if (!number_is_integer(index)) {
15871587
char buf[100];

exec/cnex/nstring.c

+100-23
Original file line numberDiff line numberDiff line change
@@ -49,24 +49,29 @@ TString *string_newString(void)
4949
}
5050

5151
c->data = NULL;
52+
c->refcount = 1;
5253
c->length = 0;
5354
return c;
5455
}
5556

5657
void string_freeString(TString *s)
5758
{
5859
if (s) {
59-
free(s->data);
60-
s->data = NULL;
61-
s->length = 0;
60+
s->refcount--;
61+
if (s->refcount <= 0) {
62+
free(s->data);
63+
s->data = NULL;
64+
s->length = 0;
65+
free(s);
66+
}
6267
}
63-
free(s);
6468
}
6569

6670
void string_clearString(TString *s)
6771
{
6872
if (s) {
6973
if (s->data) {
74+
assert(s->refcount == 1);
7075
free(s->data);
7176
s->data = NULL;
7277
s->length = 0;
@@ -76,6 +81,7 @@ void string_clearString(TString *s)
7681

7782
TString *string_copyString(TString *s)
7883
{
84+
// Note: In the (new) copied string, the refcount is set back to 1, since this is a new string.
7985
TString *r = string_newString();
8086

8187
if (s->data) {
@@ -94,22 +100,37 @@ TString *string_copyString(TString *s)
94100

95101
TString *string_fromString(TString *s)
96102
{
97-
TString *r = string_newString();
103+
TString *r = NULL; // string_newString();
98104

99105
if (s != NULL) {
106+
if (s->refcount == 1) {
107+
s->refcount++;
108+
return s;
109+
//r->data = s->data;
110+
//r->length = s->length;
111+
//r->refcount = s->refcount;
112+
//return r;
113+
}
114+
115+
r = string_newString();
100116
r->length = s->length;
101117
r->data = malloc(r->length);
102118
if (r->data == NULL) {
103119
fatal_error("Unable to allocate new string data.");
104120
}
105121
memcpy(r->data, s->data, r->length);
122+
return r;
106123
}
107-
return r;
124+
return string_newString();
108125
}
109126

110127
int string_compareString(TString *lhs, TString *rhs)
111128
{
112129
int r = 0;
130+
// If the two pointers are the same, then it's equal.
131+
if (lhs == rhs) {
132+
return r;
133+
}
113134
uint64_t size = lhs->length;
114135

115136
if (lhs->length > rhs->length) {
@@ -181,20 +202,42 @@ TString *string_appendCString(TString *s, const char *ns)
181202
return s;
182203
}
183204

205+
// NOTE: This function can possibly return a new string, and the string passed in
206+
// should never be used! Only the returned string should be referenced after
207+
// a call to this function!
184208
TString *string_appendChar(TString *s, char c)
185209
{
186-
s->data = realloc(s->data, s->length + 1);
187-
if (s->data == NULL) {
210+
TString *r = s;
211+
if (r->refcount > 1) {
212+
// We have to create a new string, since more than one string is pointing to it.
213+
r = string_copyString(s);
214+
// Then remove our reference to the (old) string.
215+
string_freeString(s);
216+
}
217+
218+
r->data = realloc(r->data, r->length + 1);
219+
if (r->data == NULL) {
188220
fatal_error("Could not reallocate data for appended character.");
189221
}
190222

191-
s->length++;
192-
s->data[s->length-1] = c;
193-
return s;
223+
r->length++;
224+
r->data[r->length-1] = c;
225+
return r;
194226
}
195227

228+
// NOTE: This function can possibly return a new string, and the string passed in
229+
// should never be used! Only the returned string should be referenced after
230+
// a call to this function!
196231
TString *string_appendCodePoint(TString *s, uint32_t cp)
197232
{
233+
TString *r = s;
234+
if (r->refcount > 1) {
235+
// We have to create a new string, since more than one string is pointing to it.
236+
r = string_copyString(s);
237+
// Then remove our reference to the (old) string.
238+
string_freeString(s);
239+
}
240+
198241
char val[4];
199242
uint32_t lead_byte = 0x7F;
200243
int index = 0;
@@ -205,21 +248,33 @@ TString *string_appendCodePoint(TString *s, uint32_t cp)
205248
}
206249
val[index++] = (cp & lead_byte) | (~lead_byte << 1);
207250
while (index) {
208-
s = string_appendChar(s, val[--index]);
251+
r = string_appendChar(s, val[--index]);
209252
}
210-
return s;
253+
return r;
211254
}
212255

256+
// NOTE: This function can possibly return a new string, and the string passed in
257+
// should never be used! Only the returned string should be referenced after
258+
// a call to this function!
213259
TString *string_appendData(TString *s, char *buf, size_t len)
214260
{
215-
s->data = realloc(s->data, s->length + len);
216-
if (s->data == NULL) {
261+
TString *r = s;
262+
if (s->refcount > 1) {
263+
assert(s->refcount > 1);
264+
// We have to create a new string, since more than one string is pointing to it.
265+
r = string_copyString(s);
266+
// Then remove our reference to the (old) string.
267+
string_freeString(s);
268+
}
269+
270+
r->data = realloc(r->data, r->length + len);
271+
if (r->data == NULL) {
217272
fatal_error("Could not reallocate string for append data.");
218273
}
219274

220-
memcpy(&s->data[s->length], buf, len);
221-
s->length += len;
222-
return s;
275+
memcpy(&r->data[r->length], buf, len);
276+
r->length += len;
277+
return r;
223278
}
224279

225280
void string_resizeString(TString *s, size_t n)
@@ -233,14 +288,22 @@ void string_resizeString(TString *s, size_t n)
233288

234289
TString *string_appendString(TString *s, TString *ns)
235290
{
236-
s->data = realloc(s->data, s->length + ns->length);
237-
if (s->data == NULL) {
291+
TString *r = s;
292+
if (s->refcount > 1) {
293+
assert(s->refcount > 1);
294+
// We have to create a new string, since more than one string is pointing to it.
295+
r = string_copyString(s);
296+
// Then remove our reference to the (old) string.
297+
string_freeString(s);
298+
}
299+
r->data = realloc(r->data, r->length + ns->length);
300+
if (r->data == NULL) {
238301
fatal_error("Could not allocate appended TString data.");
239302
}
240303

241-
memcpy(&s->data[s->length], ns->data, ns->length);
242-
s->length += ns->length;
243-
return s;
304+
memcpy(&r->data[r->length], ns->data, ns->length);
305+
r->length += ns->length;
306+
return r;
244307
}
245308

246309
/* NOTE: The caller is responsible for freeing the string created from this function! */
@@ -486,6 +549,7 @@ const char *string_ensureNullTerminated(TString *s)
486549

487550
// NOTE: The following functions return NEW string objects from existing strings.
488551
// Return the middle part of a string, starting at pos, for count number of bytes.
552+
// NOTE: New string returned, so refcount will be set to 1 on the new string.
489553
TString *string_subString(TString *s, int64_t pos, int64_t count)
490554
{
491555
int64_t newLen = count;
@@ -505,6 +569,7 @@ TString *string_subString(TString *s, int64_t pos, int64_t count)
505569

506570
TString *string_toLowerCase(TString *s)
507571
{
572+
// Note: returned string will always have a refcount of 1.
508573
TString *r = string_createString(s->length);
509574

510575
for (size_t i = 0; i < s->length; i++) {
@@ -516,6 +581,7 @@ TString *string_toLowerCase(TString *s)
516581

517582
TString *string_toUpperCase(TString *s)
518583
{
584+
// Note: returned string will always have a refcount of 1.
519585
TString *r = string_createString(s->length);
520586

521587
for (size_t i = 0; i < s->length; i++) {
@@ -532,6 +598,8 @@ TString *string_toUpperCase(TString *s)
532598
TString *string_quoteInPlace(TString *s)
533599
{
534600
TString *r = string_quote(s);
601+
602+
// Do the modification on the provided string.
535603
free(s->data);
536604
s->data = r->data;
537605
s->length = r->length;
@@ -542,6 +610,9 @@ TString *string_quoteInPlace(TString *s)
542610
// This may not be the best place for this, because it is not part of
543611
// the implementation of TString, but is just a specific string utility
544612
// function. But there wasn't an obviously better place to put it.
613+
// NOTE: The returned string will have a refcount of 1, so a new string
614+
// is returned, in all cases. This means that we may have to call
615+
// string_freeString() on it when we're done with it.
545616
TString *string_quote(TString *s)
546617
{
547618
TString *r = string_newString();
@@ -573,6 +644,7 @@ TString *string_quote(TString *s)
573644
i++;
574645
if ((s->data[i] & 0xc0) != 0x80) {
575646
// Garbage data, give up.
647+
// Should this raise an exception?
576648
break;
577649
}
578650
c = (c << 6) | (s->data[i] & 0x3f);
@@ -606,6 +678,9 @@ TString *string_quote(TString *s)
606678
}
607679
}
608680
string_appendChar(r, '"');
681+
if (s->refcount > 1) {
682+
string_freeString(s);
683+
}
609684
return r;
610685
}
611686

@@ -642,6 +717,7 @@ size_t string_getLength(TString *s)
642717

643718
TString *string_index(TString *s, size_t index)
644719
{
720+
// Returned string will have a refcount of 1;
645721
TString *r = string_createString(0);
646722

647723
size_t idx = 0;
@@ -666,6 +742,7 @@ TString *string_index(TString *s, size_t index)
666742
c &= 0x01;
667743
n = 6;
668744
} else {
745+
// Should this exit cnex? What happens in neonx.exe?
669746
fatal_error("Invalid UTF8 in string: %02x", s->data[i]);
670747
}
671748
} else {

exec/cnex/nstring.h

+1
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@
1616

1717
typedef struct tagTString {
1818
size_t length;
19+
int refcount;
1920
char *data;
2021
} TString;
2122

0 commit comments

Comments
 (0)