1
/* Copyright (C) 2000 MySQL AB
3
This program is free software; you can redistribute it and/or modify
4
it under the terms of the GNU General Public License as published by
5
the Free Software Foundation; version 2 of the License.
7
This program is distributed in the hope that it will be useful,
8
but WITHOUT ANY WARRANTY; without even the implied warranty of
9
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10
GNU General Public License for more details.
12
You should have received a copy of the GNU General Public License
13
along with this program; if not, write to the Free Software
14
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
16
/* This file is originally from the mysql distribution. Coded by monty */
18
#ifdef USE_PRAGMA_IMPLEMENTATION
19
#pragma implementation // gcc: Class implementation
22
#include <my_global.h>
27
#include <floatingpoint.h>
31
The following extern declarations are ok as these are interface functions
32
required by the string function
35
extern void sql_alloc(size_t size);
36
extern void sql_element_free(void *ptr);
38
#include "sql_string.h"
40
/*****************************************************************************
42
*****************************************************************************/
44
bool String::real_alloc(uint32 arg_length)
46
arg_length=ALIGN_SIZE(arg_length+1);
48
if (Alloced_length < arg_length)
51
if (!(Ptr=(char*) my_malloc(arg_length,MYF(MY_WME))))
53
Alloced_length=arg_length;
62
** Check that string is big enough. Set string[alloc_length] to 0
66
bool String::realloc(uint32 alloc_length)
68
uint32 len=ALIGN_SIZE(alloc_length+1);
69
if (Alloced_length < len)
74
if ((new_ptr= (char*) my_realloc(Ptr,len,MYF(MY_WME))))
80
return TRUE; // Signal error
82
else if ((new_ptr= (char*) my_malloc(len,MYF(MY_WME))))
84
if (str_length) // Avoid bugs in memcpy on AIX
85
memcpy(new_ptr,Ptr,str_length);
86
new_ptr[str_length]=0;
92
return TRUE; // Signal error
94
Ptr[alloc_length]=0; // This make other funcs shorter
98
bool String::set(longlong num, CHARSET_INFO *cs)
100
uint l=20*cs->mbmaxlen+1;
104
str_length=(uint32) (cs->cset->longlong10_to_str)(cs,Ptr,l,-10,num);
109
bool String::set(ulonglong num, CHARSET_INFO *cs)
111
uint l=20*cs->mbmaxlen+1;
115
str_length=(uint32) (cs->cset->longlong10_to_str)(cs,Ptr,l,10,num);
120
bool String::set(double num,uint decimals, CHARSET_INFO *cs)
126
if (decimals >= NOT_FIXED_DEC)
128
uint32 len= my_sprintf(buff,(buff, "%.14g",num));// Enough for a DATETIME
129
return copy(buff, len, &my_charset_latin1, cs, &dummy_errors);
132
buff[sizeof(buff)-1]=0; // Safety
133
snprintf(buff,sizeof(buff)-1, "%.*f",(int) decimals,num);
135
sprintf(buff,"%.*f",(int) decimals,num);
137
return copy(buff,(uint32) strlen(buff), &my_charset_latin1, cs,
146
Alloced_length=0; // Force realloc
147
return realloc(str_length);
152
bool String::copy(const String &str)
154
if (alloc(str.str_length))
156
str_length=str.str_length;
157
bmove(Ptr,str.Ptr,str_length); // May be overlapping
159
str_charset=str.str_charset;
163
bool String::copy(const char *str,uint32 arg_length, CHARSET_INFO *cs)
165
if (alloc(arg_length))
167
if ((str_length=arg_length))
168
memcpy(Ptr,str,arg_length);
176
Checks that the source string can be just copied to the destination string
182
arg_length Length of string to copy.
183
from_cs Character set to copy from
184
to_cs Character set to copy to
185
uint32 *offset Returns number of unaligned bytes (arg_length % mbminlen).
188
0 No conversion needed
189
1 Either character set conversion or adding leading zeros
190
(e.g. for UCS-2) must be done
193
to_cs may be NULL for "no conversion" if the system variable
194
character_set_results is NULL.
197
bool String::needs_conversion(uint32 arg_length,
198
CHARSET_INFO *from_cs,
204
(to_cs == &my_charset_bin) ||
205
(to_cs == from_cs) ||
206
my_charset_same(from_cs, to_cs) ||
207
((from_cs == &my_charset_bin) &&
208
(!(*offset=(arg_length % to_cs->mbminlen)))))
215
Copy a string in a multi-byte character set, adding leading zeros.
221
arg_length Length of string. This should NOT be divisible by
223
offset arg_length % cs->mbminlen
224
cs Character set for 'str'
227
For real multi-byte, ASCII-incompatible character sets,
228
like UCS-2, add leading zeros if we have an incomplete character.
231
will automatically be converted into
239
bool String::copy_aligned(const char *str,uint32 arg_length, uint32 offset,
242
/* How many bytes are in incomplete character */
243
offset= cs->mbmaxlen - offset; /* How many zeros we should prepend */
244
DBUG_ASSERT(offset && offset != cs->mbmaxlen);
246
uint32 aligned_length= arg_length + offset;
247
if (alloc(aligned_length))
251
Note, this is only safe for big-endian UCS-2.
252
If we add little-endian UCS-2 sometimes, this code
253
will be more complicated. But it's OK for now.
255
bzero((char*) Ptr, offset);
256
memcpy(Ptr + offset, str, arg_length);
257
Ptr[aligned_length]=0;
258
/* str_length is always >= 0 as arg_length is != 0 */
259
str_length= aligned_length;
265
bool String::set_or_copy_aligned(const char *str,uint32 arg_length,
268
/* How many bytes are in incomplete character */
269
uint32 offset= (arg_length % cs->mbminlen);
271
if (!offset) /* All characters are complete, just copy */
273
set(str, arg_length, cs);
276
return copy_aligned(str, arg_length, offset, cs);
279
/* Copy with charset conversion */
281
bool String::copy(const char *str, uint32 arg_length,
282
CHARSET_INFO *from_cs, CHARSET_INFO *to_cs, uint *errors)
285
if (!needs_conversion(arg_length, from_cs, to_cs, &offset))
288
return copy(str, arg_length, to_cs);
290
if ((from_cs == &my_charset_bin) && offset)
293
return copy_aligned(str, arg_length, offset, to_cs);
295
uint32 new_length= to_cs->mbmaxlen*arg_length;
296
if (alloc(new_length))
298
str_length=copy_and_convert((char*) Ptr, new_length, to_cs,
299
str, arg_length, from_cs, errors);
306
Set a string to the value of a latin1-string, keeping the original charset
310
str String of a simple charset (latin1)
311
arg_length Length of string
314
If string object is of a simple character set, set it to point to the
316
If not, make a copy and convert it to the new character set.
320
1 Could not allocate result buffer
324
bool String::set_ascii(const char *str, uint32 arg_length)
326
if (str_charset->mbminlen == 1)
328
set(str, arg_length, str_charset);
332
return copy(str, arg_length, &my_charset_latin1, str_charset, &dummy_errors);
336
/* This is used by mysql.cc */
338
bool String::fill(uint32 max_length,char fill_char)
340
if (str_length > max_length)
341
Ptr[str_length=max_length]=0;
344
if (realloc(max_length))
346
bfill(Ptr+str_length,max_length-str_length,fill_char);
347
str_length=max_length;
352
void String::strip_sp()
354
while (str_length && my_isspace(str_charset,Ptr[str_length-1]))
358
bool String::append(const String &s)
362
if (realloc(str_length+s.length()))
364
memcpy(Ptr+str_length,s.ptr(),s.length());
365
str_length+=s.length();
372
Append an ASCII string to a string of the current character set
375
bool String::append(const char *s,uint32 arg_length)
381
For an ASCII incompatible string, e.g. UCS-2, we need to convert
383
if (str_charset->mbminlen > 1)
385
uint32 add_length=arg_length * str_charset->mbmaxlen;
387
if (realloc(str_length+ add_length))
389
str_length+= copy_and_convert(Ptr+str_length, add_length, str_charset,
390
s, arg_length, &my_charset_latin1,
396
For an ASCII compatible string we can just append.
398
if (realloc(str_length+arg_length))
400
memcpy(Ptr+str_length,s,arg_length);
401
str_length+=arg_length;
407
Append a 0-terminated ASCII string
410
/*
  Append a NUL-terminated string.

  The length is measured with strlen() and the call is forwarded to the
  (pointer, length) overload of append(); the result of that overload is
  returned unchanged.

  NOTE(review): strlen() yields size_t while the forwarded length parameter
  is uint32, so the length is narrowed implicitly at the call.
*/
bool String::append(const char *s)
412
return append(s, strlen(s));
417
Append a string in the given charset to the string
418
with character set recoding
421
bool String::append(const char *s,uint32 arg_length, CHARSET_INFO *cs)
425
if (needs_conversion(arg_length, cs, str_charset, &dummy_offset))
427
uint32 add_length= arg_length / cs->mbminlen * str_charset->mbmaxlen;
429
if (realloc(str_length + add_length))
431
str_length+= copy_and_convert(Ptr+str_length, add_length, str_charset,
432
s, arg_length, cs, &dummy_errors);
436
if (realloc(str_length + arg_length))
438
memcpy(Ptr + str_length, s, arg_length);
439
str_length+= arg_length;
445
bool String::append(IO_CACHE* file, uint32 arg_length)
447
if (realloc(str_length+arg_length))
449
if (my_b_read(file, (uchar*) Ptr + str_length, arg_length))
454
str_length+=arg_length;
458
bool String::append_with_prefill(const char *s,uint32 arg_length,
459
uint32 full_length, char fill_char)
461
int t_length= arg_length > full_length ? arg_length : full_length;
463
if (realloc(str_length + t_length))
465
t_length= full_length - arg_length;
468
bfill(Ptr+str_length, t_length, fill_char);
469
str_length=str_length + t_length;
471
append(s, arg_length);
475
/*
  Return the value reported by the numchars() handler of this string's
  character set for the byte range [Ptr, Ptr + str_length).
*/
uint32 String::numchars()
477
return str_charset->cset->numchars(str_charset, Ptr, Ptr+str_length);
480
int String::charpos(int i,uint32 offset)
484
return str_charset->cset->charpos(str_charset,Ptr+offset,Ptr+str_length,i);
487
int String::strstr(const String &s,uint32 offset)
489
if (s.length()+offset <= str_length)
492
return ((int) offset); // Empty string is always found
494
register const char *str = Ptr+offset;
495
register const char *search=s.ptr();
496
const char *end=Ptr+str_length-s.length()+1;
497
const char *search_end=s.ptr()+s.length();
501
if (*str++ == *search)
504
i=(char*) str; j=(char*) search+1;
505
while (j != search_end)
506
if (*i++ != *j++) goto skip;
507
return (int) (str-Ptr) -1;
515
** Search string from end. Offset is offset to the end of string
518
int String::strrstr(const String &s,uint32 offset)
520
if (s.length() <= offset && offset <= str_length)
523
return offset; // Empty string is always found
524
register const char *str = Ptr+offset-1;
525
register const char *search=s.ptr()+s.length()-1;
527
const char *end=Ptr+s.length()-2;
528
const char *search_end=s.ptr()-1;
532
if (*str-- == *search)
535
i=(char*) str; j=(char*) search-1;
536
while (j != search_end)
537
if (*i-- != *j--) goto skip;
538
return (int) (i-Ptr) +1;
546
Replace substring with string
547
If wrong parameter or not enough memory, do nothing
550
/*
  Convenience overload: replace arg_length bytes starting at offset with the
  contents of another String.

  Forwards to the (offset, arg_length, pointer, length) overload using
  to.ptr() and to.length(), and returns that overload's result.
*/
bool String::replace(uint32 offset,uint32 arg_length,const String &to)
552
return replace(offset,arg_length,to.ptr(),to.length());
555
bool String::replace(uint32 offset,uint32 arg_length,
556
const char *to, uint32 to_length)
558
long diff = (long) to_length-(long) arg_length;
559
if (offset+arg_length <= str_length)
564
memcpy(Ptr+offset,to,to_length);
565
bmove(Ptr+offset+to_length,Ptr+offset+arg_length,
566
str_length-offset-arg_length);
572
if (realloc(str_length+(uint32) diff))
574
bmove_upp((uchar*) Ptr+str_length+diff, (uchar*) Ptr+str_length,
575
str_length-offset-arg_length);
578
memcpy(Ptr+offset,to,to_length);
580
str_length+=(uint32) diff;
586
// added by Holyfoot for "geometry" needs
587
int String::reserve(uint32 space_needed, uint32 grow_by)
589
if (Alloced_length < str_length + space_needed)
591
if (realloc(Alloced_length + max(space_needed, grow_by) - 1))
597
void String::qs_append(const char *str, uint32 len)
599
memcpy(Ptr + str_length, str, len + 1);
603
/*
  Append the text form of a double directly at the current end of the buffer.

  my_gcvt() writes into Ptr + str_length and str_length is advanced by the
  value my_gcvt() returns. No capacity check or reallocation is done here.
  NOTE(review): presumably the caller must reserve at least
  FLOATING_POINT_BUFFER bytes beforehand (e.g. via reserve()) - confirm.
*/
void String::qs_append(double d)
605
char *buff = Ptr + str_length;
606
str_length+= my_gcvt(d, MY_GCVT_ARG_DOUBLE, FLOATING_POINT_BUFFER - 1, buff, NULL);
609
void String::qs_append(double *d)
612
float8get(ld, (char*) d);
616
/*
  Append the text form of an int directly at the current end of the buffer.

  int10_to_str() writes at Ptr + str_length and returns a pointer past the
  last character written; str_length grows by that distance. No capacity
  check or reallocation is done here.
  NOTE(review): radix argument -10 presumably selects signed decimal output -
  confirm against the int10_to_str() documentation.
*/
void String::qs_append(int i)
618
char *buff= Ptr + str_length;
619
char *end= int10_to_str(i, buff, -10);
620
str_length+= (int) (end-buff);
623
/*
  Append the text form of an unsigned int directly at the current end of the
  buffer.

  int10_to_str() writes at Ptr + str_length and returns a pointer past the
  last character written; str_length grows by that distance. No capacity
  check or reallocation is done here.
  NOTE(review): radix argument 10 presumably selects unsigned decimal output -
  confirm against the int10_to_str() documentation.
*/
void String::qs_append(uint i)
625
char *buff= Ptr + str_length;
626
char *end= int10_to_str(i, buff, 10);
627
str_length+= (int) (end-buff);
631
Compare strings according to collation, without end space.
640
Normally this is case sensitive comparison
649
/*
  Compare two strings using the collation of the supplied character set.

  Both buffers and their lengths are handed to the collation handler
  cs->coll->strnncollsp(), with 0 as the last argument, and the handler
  result is returned as is.

  s, t  Strings to compare
  cs    Character set whose collation handler performs the comparison
*/
int sortcmp(const String *s,const String *t, CHARSET_INFO *cs)
651
return cs->coll->strnncollsp(cs,
652
(unsigned char *) s->ptr(),s->length(),
653
(unsigned char *) t->ptr(),t->length(), 0);
658
Compare strings byte by byte. End spaces are also compared.
666
Strings are compared as a stream of unsigned chars
675
/*
  Byte-wise comparison of two strings.

  The first min(s_len, t_len) bytes are compared with memcmp(). If they
  differ, the memcmp() result is returned. If they are equal, the result is
  the difference of the two lengths, so the shorter string compares lower.
*/
int stringcmp(const String *s,const String *t)
677
uint32 s_len=s->length(),t_len=t->length(),len=min(s_len,t_len);
678
int cmp= memcmp(s->ptr(), t->ptr(), len);
679
/* The length difference is computed in uint32 and then cast to int */
return (cmp) ? cmp : (int) (s_len - t_len);
683
String *copy_if_not_alloced(String *to,String *from,uint32 from_length)
685
if (from->Alloced_length >= from_length)
687
if (from->alloced || !to || from == to)
689
(void) from->realloc(from_length);
692
if (to->realloc(from_length))
693
return from; // Actually an error
694
if ((to->str_length=min(from->str_length,from_length)))
695
memcpy(to->Ptr,from->Ptr,to->str_length);
696
to->str_charset=from->str_charset;
701
/****************************************************************************
703
****************************************************************************/
706
copy a string from one character set to another
711
to_cs Character set of result string
713
from_length Length of from string
714
from_cs From character set
717
'to' must be at least from_length * to_cs->mbmaxlen bytes long
720
length of bytes copied to 'to'
725
copy_and_convert(char *to, uint32 to_length, CHARSET_INFO *to_cs,
726
const char *from, uint32 from_length, CHARSET_INFO *from_cs,
731
const uchar *from_end= (const uchar*) from+from_length;
733
uchar *to_end= (uchar*) to+to_length;
734
my_charset_conv_mb_wc mb_wc= from_cs->cset->mb_wc;
735
my_charset_conv_wc_mb wc_mb= to_cs->cset->wc_mb;
740
if ((cnvres= (*mb_wc)(from_cs, &wc, (uchar*) from,
743
else if (cnvres == MY_CS_ILSEQ)
749
else if (cnvres > MY_CS_TOOSMALL)
752
A correct multibyte sequence detected
753
But it doesn't have Unicode mapping.
760
break; // Not enough characters
763
if ((cnvres= (*wc_mb)(to_cs, wc, (uchar*) to, to_end)) > 0)
765
else if (cnvres == MY_CS_ILUNI && wc != '?')
774
*errors= error_count;
775
return (uint32) (to - to_start);
779
void String::print(String *str)
781
char *st= (char*)Ptr, *end= st+str_length;
782
for (; st < end; st++)
788
str->append(STRING_WITH_LEN("\\\\"));
791
str->append(STRING_WITH_LEN("\\0"));
794
str->append(STRING_WITH_LEN("\\'"));
797
str->append(STRING_WITH_LEN("\\n"));
800
str->append(STRING_WITH_LEN("\\r"));
803
str->append(STRING_WITH_LEN("\\z"));
813
Exchange state of this object and argument.
819
Target string will contain state of this object and vice versa.
822
/*
  Exchange the complete state of this object with s.

  Each of the five members is swapped with the swap_variables() macro:
  the buffer pointer, the current length, the allocated length, the
  "alloced" flag and the character set pointer. No buffer contents are
  copied.
*/
void String::swap(String &s)
824
swap_variables(char *, Ptr, s.Ptr);
825
swap_variables(uint32, str_length, s.str_length);
826
swap_variables(uint32, Alloced_length, s.Alloced_length);
827
swap_variables(bool, alloced, s.alloced);
828
swap_variables(CHARSET_INFO*, str_charset, s.str_charset);