@@ -49,24 +49,29 @@ TString *string_newString(void)
49
49
}
50
50
51
51
c -> data = NULL ;
52
+ c -> refcount = 1 ;
52
53
c -> length = 0 ;
53
54
return c ;
54
55
}
55
56
56
57
void string_freeString (TString * s )
57
58
{
58
59
if (s ) {
59
- free (s -> data );
60
- s -> data = NULL ;
61
- s -> length = 0 ;
60
+ s -> refcount -- ;
61
+ if (s -> refcount <= 0 ) {
62
+ free (s -> data );
63
+ s -> data = NULL ;
64
+ s -> length = 0 ;
65
+ free (s );
66
+ }
62
67
}
63
- free (s );
64
68
}
65
69
66
70
void string_clearString (TString * s )
67
71
{
68
72
if (s ) {
69
73
if (s -> data ) {
74
+ assert (s -> refcount == 1 );
70
75
free (s -> data );
71
76
s -> data = NULL ;
72
77
s -> length = 0 ;
@@ -76,6 +81,7 @@ void string_clearString(TString *s)
76
81
77
82
TString * string_copyString (TString * s )
78
83
{
84
+ // Note: In the (new) copied string, the refcount is set back to 1, since this is a new string.
79
85
TString * r = string_newString ();
80
86
81
87
if (s -> data ) {
@@ -94,22 +100,37 @@ TString *string_copyString(TString *s)
94
100
95
101
TString * string_fromString (TString * s )
96
102
{
97
- TString * r = string_newString ();
103
+ TString * r = NULL ; // string_newString();
98
104
99
105
if (s != NULL ) {
106
+ if (s -> refcount == 1 ) {
107
+ s -> refcount ++ ;
108
+ return s ;
109
+ //r->data = s->data;
110
+ //r->length = s->length;
111
+ //r->refcount = s->refcount;
112
+ //return r;
113
+ }
114
+
115
+ r = string_newString ();
100
116
r -> length = s -> length ;
101
117
r -> data = malloc (r -> length );
102
118
if (r -> data == NULL ) {
103
119
fatal_error ("Unable to allocate new string data." );
104
120
}
105
121
memcpy (r -> data , s -> data , r -> length );
122
+ return r ;
106
123
}
107
- return r ;
124
+ return string_newString () ;
108
125
}
109
126
110
127
int string_compareString (TString * lhs , TString * rhs )
111
128
{
112
129
int r = 0 ;
130
+ // If the two pointers are the same, then it's equal.
131
+ if (lhs == rhs ) {
132
+ return r ;
133
+ }
113
134
uint64_t size = lhs -> length ;
114
135
115
136
if (lhs -> length > rhs -> length ) {
@@ -181,20 +202,42 @@ TString *string_appendCString(TString *s, const char *ns)
181
202
return s ;
182
203
}
183
204
205
+ // NOTE: This function can possibly return a new string, and the string passed in
206
+ // should never be used! Only the returned string should be referenced after
207
+ // a call to this function!
184
208
TString * string_appendChar (TString * s , char c )
185
209
{
186
- s -> data = realloc (s -> data , s -> length + 1 );
187
- if (s -> data == NULL ) {
210
+ TString * r = s ;
211
+ if (r -> refcount > 1 ) {
212
+ // We have to create a new string, since more than one string is pointing to it.
213
+ r = string_copyString (s );
214
+ // Then remove our reference to the (old) string.
215
+ string_freeString (s );
216
+ }
217
+
218
+ r -> data = realloc (r -> data , r -> length + 1 );
219
+ if (r -> data == NULL ) {
188
220
fatal_error ("Could not reallocate data for appended character." );
189
221
}
190
222
191
- s -> length ++ ;
192
- s -> data [s -> length - 1 ] = c ;
193
- return s ;
223
+ r -> length ++ ;
224
+ r -> data [r -> length - 1 ] = c ;
225
+ return r ;
194
226
}
195
227
228
+ // NOTE: This function can possibly return a new string, and the string passed in
229
+ // should never be used! Only the returned string should be referenced after
230
+ // a call to this function!
196
231
TString * string_appendCodePoint (TString * s , uint32_t cp )
197
232
{
233
+ TString * r = s ;
234
+ if (r -> refcount > 1 ) {
235
+ // We have to create a new string, since more than one string is pointing to it.
236
+ r = string_copyString (s );
237
+ // Then remove our reference to the (old) string.
238
+ string_freeString (s );
239
+ }
240
+
198
241
char val [4 ];
199
242
uint32_t lead_byte = 0x7F ;
200
243
int index = 0 ;
@@ -205,21 +248,33 @@ TString *string_appendCodePoint(TString *s, uint32_t cp)
205
248
}
206
249
val [index ++ ] = (cp & lead_byte ) | (~lead_byte << 1 );
207
250
while (index ) {
208
- s = string_appendChar (s , val [-- index ]);
251
+ r = string_appendChar (s , val [-- index ]);
209
252
}
210
- return s ;
253
+ return r ;
211
254
}
212
255
256
+ // NOTE: This function can possibly return a new string, and the string passed in
257
+ // should never be used! Only the returned string should be referenced after
258
+ // a call to this function!
213
259
TString * string_appendData (TString * s , char * buf , size_t len )
214
260
{
215
- s -> data = realloc (s -> data , s -> length + len );
216
- if (s -> data == NULL ) {
261
+ TString * r = s ;
262
+ if (s -> refcount > 1 ) {
263
+ assert (s -> refcount > 1 );
264
+ // We have to create a new string, since more than one string is pointing to it.
265
+ r = string_copyString (s );
266
+ // Then remove our reference to the (old) string.
267
+ string_freeString (s );
268
+ }
269
+
270
+ r -> data = realloc (r -> data , r -> length + len );
271
+ if (r -> data == NULL ) {
217
272
fatal_error ("Could not reallocate string for append data." );
218
273
}
219
274
220
- memcpy (& s -> data [s -> length ], buf , len );
221
- s -> length += len ;
222
- return s ;
275
+ memcpy (& r -> data [r -> length ], buf , len );
276
+ r -> length += len ;
277
+ return r ;
223
278
}
224
279
225
280
void string_resizeString (TString * s , size_t n )
@@ -233,14 +288,22 @@ void string_resizeString(TString *s, size_t n)
233
288
234
289
TString * string_appendString (TString * s , TString * ns )
235
290
{
236
- s -> data = realloc (s -> data , s -> length + ns -> length );
237
- if (s -> data == NULL ) {
291
+ TString * r = s ;
292
+ if (s -> refcount > 1 ) {
293
+ assert (s -> refcount > 1 );
294
+ // We have to create a new string, since more than one string is pointing to it.
295
+ r = string_copyString (s );
296
+ // Then remove our reference to the (old) string.
297
+ string_freeString (s );
298
+ }
299
+ r -> data = realloc (r -> data , r -> length + ns -> length );
300
+ if (r -> data == NULL ) {
238
301
fatal_error ("Could not allocate appended TString data." );
239
302
}
240
303
241
- memcpy (& s -> data [s -> length ], ns -> data , ns -> length );
242
- s -> length += ns -> length ;
243
- return s ;
304
+ memcpy (& r -> data [r -> length ], ns -> data , ns -> length );
305
+ r -> length += ns -> length ;
306
+ return r ;
244
307
}
245
308
246
309
/* NOTE: The caller is responsible for freeing the string created from this function! */
@@ -486,6 +549,7 @@ const char *string_ensureNullTerminated(TString *s)
486
549
487
550
// NOTE: The following functions return NEW string objects from existing strings.
488
551
// Return the middle part of a string, starting at pos, for count number of bytes.
552
+ // NOTE: New string returned, so refcount will be set to 1 on the new string.
489
553
TString * string_subString (TString * s , int64_t pos , int64_t count )
490
554
{
491
555
int64_t newLen = count ;
@@ -505,6 +569,7 @@ TString *string_subString(TString *s, int64_t pos, int64_t count)
505
569
506
570
TString * string_toLowerCase (TString * s )
507
571
{
572
+ // Note: returned string will always have a refcount of 1.
508
573
TString * r = string_createString (s -> length );
509
574
510
575
for (size_t i = 0 ; i < s -> length ; i ++ ) {
@@ -516,6 +581,7 @@ TString *string_toLowerCase(TString *s)
516
581
517
582
TString * string_toUpperCase (TString * s )
518
583
{
584
+ // Note: returned string will always have a refcount of 1.
519
585
TString * r = string_createString (s -> length );
520
586
521
587
for (size_t i = 0 ; i < s -> length ; i ++ ) {
@@ -532,6 +598,8 @@ TString *string_toUpperCase(TString *s)
532
598
TString * string_quoteInPlace (TString * s )
533
599
{
534
600
TString * r = string_quote (s );
601
+
602
+ // Do the modification on the provided string.
535
603
free (s -> data );
536
604
s -> data = r -> data ;
537
605
s -> length = r -> length ;
@@ -542,6 +610,9 @@ TString *string_quoteInPlace(TString *s)
542
610
// This may not be the best place for this, because it is not part of
543
611
// the implementation of TString, but is just a specific string utility
544
612
// function. But there wasn't an obviously better place to put it.
613
+ // NOTE: The returned string will have a refcount of 1, so a new string
614
+ // is returned, in all cases. This means that we may have to call
615
+ // string_freeString() on it when we're done with it.
545
616
TString * string_quote (TString * s )
546
617
{
547
618
TString * r = string_newString ();
@@ -573,6 +644,7 @@ TString *string_quote(TString *s)
573
644
i ++ ;
574
645
if ((s -> data [i ] & 0xc0 ) != 0x80 ) {
575
646
// Garbage data, give up.
647
+ // Should this raise an exception?
576
648
break ;
577
649
}
578
650
c = (c << 6 ) | (s -> data [i ] & 0x3f );
@@ -606,6 +678,9 @@ TString *string_quote(TString *s)
606
678
}
607
679
}
608
680
string_appendChar (r , '"' );
681
+ if (s -> refcount > 1 ) {
682
+ string_freeString (s );
683
+ }
609
684
return r ;
610
685
}
611
686
@@ -642,6 +717,7 @@ size_t string_getLength(TString *s)
642
717
643
718
TString * string_index (TString * s , size_t index )
644
719
{
720
+ // Returned string will have a refcount of 1;
645
721
TString * r = string_createString (0 );
646
722
647
723
size_t idx = 0 ;
@@ -666,6 +742,7 @@ TString *string_index(TString *s, size_t index)
666
742
c &= 0x01 ;
667
743
n = 6 ;
668
744
} else {
745
+ // Should this exit cnex? What happens in neonx.exe?
669
746
fatal_error ("Invalid UTF8 in string: %02x" , s -> data [i ]);
670
747
}
671
748
} else {
0 commit comments