56
56
#include <sys/stat.h>
57
57
#include <sys/types.h>
59
#include <boost/array.hpp>
60
#include <boost/foreach.hpp>
61
59
#include <boost/program_options.hpp>
62
#include <boost/smart_ptr.hpp>
64
61
#include PCRE_HEADER
66
63
#include <stdarg.h>
67
64
#include <boost/unordered_map.hpp>
69
68
/* Added this for string translation. */
70
#include <drizzled/gettext.h>
71
#include <drizzled/type/time.h>
72
#include <drizzled/charset.h>
73
#include <drizzled/typelib.h>
69
#include "drizzled/gettext.h"
70
#include "drizzled/drizzle_time.h"
71
#include "drizzled/charset.h"
74
72
#include <drizzled/configmake.h>
76
/*
  Distance in bytes from B to A: both arguments are reinterpreted as
  pointers to const unsigned char, subtracted, and the result is cast to
  ptrdiff_t. The value is negative when A precedes B.
*/
#define PTR_BYTE_DIFF(A,B) (ptrdiff_t) (reinterpret_cast<const unsigned char*>(A) - reinterpret_cast<const unsigned char*>(B))
78
74
#ifndef DRIZZLE_RETURN_SERVER_GONE
79
75
#define DRIZZLE_RETURN_HANDSHAKE_FAILED DRIZZLE_RETURN_ERROR_CODE
171
165
uint32_t lineno; /* Current line in file */
174
static boost::array<st_test_file, 16> file_stack;
175
static st_test_file* cur_file;
168
static struct st_test_file file_stack[16];
169
static struct st_test_file* cur_file;
170
static struct st_test_file* file_stack_end;
177
173
static const CHARSET_INFO *charset_info= &my_charset_utf8_general_ci; /* Default charset */
183
179
static char *timer_file = NULL;
184
180
static uint64_t timer_start;
185
static void timer_output();
186
static uint64_t timer_now();
181
static void timer_output(void);
182
static uint64_t timer_now(void);
188
184
static uint64_t progress_start= 0;
395
390
struct st_match_err err[10];
399
static st_expected_errors saved_expected_errors;
393
static struct st_expected_errors saved_expected_errors;
404
397
char *query, *query_buf,*first_argument,*last_argument,*end;
405
398
int first_word_len, query_len;
406
399
bool abort_on_error;
407
400
st_expected_errors expected_errors;
408
401
string require_file;
402
enum enum_commands type;
412
405
: query(NULL), query_buf(NULL), first_argument(NULL), last_argument(NULL),
443
439
VAR* var_from_env(const char *, const char *);
444
440
VAR* var_init(VAR* v, const char *name, int name_len, const char *val,
442
void var_free(pair<string, VAR*> v);
446
443
VAR* var_get(const char *var_name, const char** var_name_end,
447
444
bool raw, bool ignore_not_existing);
448
445
void eval_expr(VAR* v, const char *p, const char** p_end);
449
446
bool match_delimiter(int c, const char *delim, uint32_t length);
450
447
void dump_result_to_reject_file(char *buf, int size);
451
448
void dump_result_to_log_file(const char *buf, int size);
452
void dump_warning_messages();
453
void dump_progress();
449
void dump_warning_messages(void);
450
void dump_progress(void);
455
452
void do_eval(string *query_eval, const char *query,
456
453
const char *query_end, bool pass_through_escape_chars);
461
458
static char *replace_column[MAX_COLUMNS];
462
459
static uint32_t max_replace_column= 0;
463
460
void do_get_replace_column(struct st_command*);
464
void free_replace_column();
461
void free_replace_column(void);
466
463
/* For replace */
467
464
void do_get_replace(struct st_command *command);
465
void free_replace(void);
470
467
/* For replace_regex */
471
468
void do_get_replace_regex(struct st_command *command);
469
void free_replace_regex(void);
472
void free_all_replace(void);
475
void free_all_replace(void){
477
free_replace_regex();
478
free_replace_column();
473
481
void replace_append_mem(string *ds, const char *val,
875
887
free(next_con->name);
880
static void close_files()
893
static void close_files(void)
882
for (; cur_file >= file_stack.data(); cur_file--)
896
for (; cur_file >= file_stack; cur_file--)
884
898
if (cur_file->file && cur_file->file != stdin)
885
900
fclose(cur_file->file);
886
free(const_cast<char*>(cur_file->file_name));
902
free((unsigned char*) cur_file->file_name);
887
903
cur_file->file_name= 0;
891
static void free_used_memory()
909
static void free_used_memory(void)
893
914
close_connections();
895
BOOST_FOREACH(var_hash_t::reference i, var_hash)
897
free(i.second->str_val);
898
free(i.second->env_s);
899
if (i.second->alloced)
916
for_each(var_hash.begin(), var_hash.end(), var_free);
902
917
var_hash.clear();
903
BOOST_FOREACH(vector<st_command*>::reference i, q_lines)
905
for (size_t i= 0; i < var_reg.size(); i++)
919
vector<st_command *>::iterator iter;
920
for (iter= q_lines.begin() ; iter < q_lines.end() ; iter++)
922
struct st_command * q_line= *iter;
926
for (i= 0; i < 10; i++)
907
928
if (var_reg[i].alloced_len)
908
929
free(var_reg[i].str_val);
910
932
free_all_replace();
1014
1039
/* Print include filestack */
1015
1040
fprintf(stderr, "The test '%s' is not supported by this installation\n",
1016
file_stack[0].file_name);
1041
file_stack->file_name);
1017
1042
fprintf(stderr, "Detected in file %s at line %d\n",
1018
1043
err_file->file_name, err_file->lineno);
1019
while (err_file != file_stack.data())
1044
while (err_file != file_stack)
1022
1047
fprintf(stderr, "included from %s at line %d\n",
1436
1463
char temp_file_path[FN_REFLEN];
1438
if ((fd= internal::create_temp_file(temp_file_path, TMPDIR,
1465
if ((fd= internal::create_temp_file(temp_file_path, NULL,
1439
1466
"tmp", MYF(MY_WME))) < 0)
1440
1467
die("Failed to create temporary file for ds");
1603
1630
VAR *var_init(VAR *v, const char *name, int name_len, const char *val,
1606
1635
if (!name_len && name)
1607
1636
name_len = strlen(name);
1608
1637
if (!val_len && val)
1609
1638
val_len = strlen(val) ;
1610
VAR *tmp_var = v ? v : (VAR*)malloc(sizeof(*tmp_var) + name_len+1);
1639
val_alloc_len = val_len + 16; /* room to grow */
1640
if (!(tmp_var=v) && !(tmp_var = (VAR*)malloc(sizeof(*tmp_var)
1642
die("Out of memory");
1612
tmp_var->name = name ? (char*)&tmp_var[1] : 0;
1644
tmp_var->name = (name) ? (char*) tmp_var + sizeof(*tmp_var) : 0;
1613
1645
tmp_var->alloced = (v == 0);
1615
int val_alloc_len = val_len + 16; /* room to grow */
1616
tmp_var->str_val = (char*)malloc(val_alloc_len+1);
1647
if (!(tmp_var->str_val = (char *)malloc(val_alloc_len+1)))
1648
die("Out of memory");
1618
1650
memcpy(tmp_var->name, name, name_len);
1624
1656
tmp_var->name_len = name_len;
1625
1657
tmp_var->str_val_len = val_len;
1626
1658
tmp_var->alloced_len = val_alloc_len;
1627
tmp_var->int_val = val ? atoi(val) : 0;
1628
tmp_var->int_dirty = false;
1659
tmp_var->int_val = (val) ? atoi(val) : 0;
1660
tmp_var->int_dirty = 0;
1629
1661
tmp_var->env_s = 0;
1630
1662
return tmp_var;
1666
void var_free(pair<string, VAR *> v)
1668
free(v.second->str_val);
1669
free(v.second->env_s);
1670
if (v.second->alloced)
1633
1675
VAR* var_from_env(const char *name, const char *def_val)
1635
const char *tmp= getenv(name);
1679
if (!(tmp = getenv(name)))
1638
return var_hash[name] = var_init(0, name, strlen(name), tmp, strlen(tmp));
1682
v = var_init(0, name, strlen(name), tmp, strlen(tmp));
1683
string var_name(name);
1684
var_hash.insert(make_pair(var_name, v));
1641
1689
VAR* var_get(const char *var_name, const char **var_name_end, bool raw,
1642
1690
bool ignore_not_existing)
1646
1695
if (*var_name != '$')
1648
1697
digit = *++var_name - '0';
1664
1713
die("Too long variable name: %s", save_var_name);
1666
1715
string save_var_name_str(save_var_name, length);
1667
var_hash_t::iterator iter= var_hash.find(save_var_name_str);
1716
boost::unordered_map<string, VAR*>::iterator iter=
1717
var_hash.find(save_var_name_str);
1668
1718
if (iter == var_hash.end())
1670
1720
char buff[MAX_VAR_NAME_LENGTH+1];
1701
1751
static VAR *var_obtain(const char *name, int len)
1703
1753
string var_name(name, len);
1704
var_hash_t::iterator iter= var_hash.find(var_name);
1754
boost::unordered_map<string, VAR*>::iterator iter=
1755
var_hash.find(var_name);
1705
1756
if (iter != var_hash.end())
1706
return iter->second;
1707
return var_hash[var_name] = var_init(0, name, len, "", 0);
1757
return (*iter).second;
1758
VAR *v = var_init(0, name, len, "", 0);
1759
var_hash.insert(make_pair(var_name, v));
2108
2163
internal::fn_format(buff, name, "", "", MY_UNPACK_FILENAME);
2165
if (cur_file == file_stack_end)
2166
die("Source directives are nesting too deep");
2111
if (cur_file == &*file_stack.end())
2112
die("Source directives are nesting too deep");
2113
2168
if (!(cur_file->file= fopen(buff, "r")))
3275
3341
sleep_val= opt_sleep;
3278
usleep(sleep_val * 1000000);
3344
usleep((uint32_t) (sleep_val * 1000000L));
3279
3345
command->last_argument= sleep_end;
3284
static void do_get_file_name(st_command *command, string &dest)
3350
static void do_get_file_name(struct st_command *command, string &dest)
3286
char *p= command->first_argument;
3352
char *p= command->first_argument, *name;
3288
3354
die("Missing file name argument");
3290
3356
while (*p && !my_isspace(charset_info,*p))
3321
3387
abort_not_supported_test("Test requires charset '%s'", charset_name);
3324
static void fill_global_error_names()
3326
drizzle_result_st res;
3327
drizzle_return_t ret;
3329
drizzle_con_st *con= &cur_con->con;
3331
global_error_names.clear();
3333
const std::string ds_query("select error_name, error_code "
3334
"from data_dictionary.errors");
3335
if (drizzle_query_str(con, &res, ds_query.c_str(), &ret) == NULL ||
3336
ret != DRIZZLE_RETURN_OK)
3338
if (ret == DRIZZLE_RETURN_ERROR_CODE)
3340
die("Error running query '%s': %d %s", ds_query.c_str(),
3341
drizzle_result_error_code(&res), drizzle_result_error(&res));
3342
drizzle_result_free(&res);
3346
die("Error running query '%s': %d %s", ds_query.c_str(), ret,
3347
drizzle_con_error(con));
3350
if (drizzle_result_column_count(&res) == 0 ||
3351
drizzle_result_buffer(&res) != DRIZZLE_RETURN_OK)
3353
drizzle_result_free(&res);
3354
die("Query '%s' didn't return a result set", ds_query.c_str());
3357
while ((row= drizzle_row_next(&res)) && row[0])
3360
Concatenate all fields in the first row with tab in between
3361
and assign that string to the $variable
3363
size_t *lengths= drizzle_row_field_sizes(&res);
3366
global_error_names[string(row[0], lengths[0])] = boost::lexical_cast<uint32_t>(string(row[1], lengths[1]));
3368
catch (boost::bad_lexical_cast &ex)
3370
drizzle_result_free(&res);
3371
die("Invalid error_code from Drizzle: %s", ex.what());
3376
drizzle_result_free(&res);
3379
3390
static uint32_t get_errcode_from_name(char *error_name, char *error_end)
3381
3392
size_t err_name_len= error_end - error_name;
3382
3393
string error_name_s(error_name, err_name_len);
3384
ErrorCodes::iterator it= global_error_names.find(error_name_s);
3385
if (it != global_error_names.end())
3388
die("Unknown SQL error name '%s'", error_name_s.c_str());
3395
uint32_t code= global_error_names.getErrorCode(error_name_s);
3398
die("Unknown SQL error name '%s'", error_name_s.c_str());
3392
3403
static void do_get_errcodes(struct st_command *command)
3455
3466
die("The error name definition must start with an uppercase E");
3459
/* Error name string */
3461
to->code.errnum= get_errcode_from_name(p, end);
3472
/* Check that the string passed to str2int only contain digits */
3473
while (*p && p != end)
3475
if (!my_isdigit(charset_info, *p))
3476
die("Invalid argument to error: '%s' - " \
3477
"the errno may only consist of digits[0-9]",
3478
command->first_argument);
3482
/* Convert the string to int */
3483
istringstream buff(start);
3484
if ((buff >> val).fail())
3485
die("Invalid argument to error: '%s'", command->first_argument);
3487
to->code.errnum= (uint32_t) val;
3462
3488
to->type= ERR_ERRNO;
3466
die ("You must either use the SQLSTATE or built in drizzle error label, numbers are not accepted");
4697
4719
for (i = 0; i < num_fields; i++)
4699
4721
column= drizzle_column_next(res);
4700
if (row[i] && (drizzle_column_type(column) == DRIZZLE_COLUMN_TYPE_TINY))
4702
if (boost::lexical_cast<uint32_t>(row[i]))
4704
if ((drizzle_column_flags(column) & DRIZZLE_COLUMN_FLAGS_UNSIGNED))
4706
append_field(ds, i, column, "YES", 3, false);
4710
append_field(ds, i, column, "TRUE", 4, false);
4715
if ((drizzle_column_flags(column) & DRIZZLE_COLUMN_FLAGS_UNSIGNED))
4717
append_field(ds, i, column, "NO", 2, false);
4721
append_field(ds, i, column, "FALSE", 5, false);
4727
append_field(ds, i, column,
4728
(const char*)row[i], lengths[i], !row[i]);
4722
append_field(ds, i, column,
4723
(const char*)row[i], lengths[i], !row[i]);
4731
4725
if (!display_result_vertically)
4732
4726
ds->append("\n");
4770
4764
ds->append("\t", 1);
4771
4765
replace_append_uint(ds, drizzle_column_size(column));
4772
4766
ds->append("\t", 1);
4773
if (drizzle_column_type(column) == DRIZZLE_COLUMN_TYPE_TINY)
4775
replace_append_uint(ds, 1);
4779
replace_append_uint(ds, drizzle_column_max_size(column));
4767
replace_append_uint(ds, drizzle_column_max_size(column));
4781
4768
ds->append("\t", 1);
4782
4769
ds->append((char*) ((drizzle_column_flags(column) & DRIZZLE_COLUMN_FLAGS_NOT_NULL) ? "N" : "Y"), 1);
4783
4770
ds->append("\t", 1);
5319
5306
save= command->query[command->first_word_len-1];
5320
5307
command->query[command->first_word_len-1]= 0;
5321
if (command_typelib.find_type(command->query, 1+2) > 0)
5308
if (find_type(command->query, &command_typelib, 1+2) > 0)
5322
5309
die("Extra delimiter \";\" found");
5323
5310
command->query[command->first_word_len-1]= save;
5539
5527
next_con= connections + 1;
5541
5529
/* Init file stack */
5542
memset(file_stack.data(), 0, sizeof(file_stack));
5543
cur_file= file_stack.data();
5530
memset(file_stack, 0, sizeof(file_stack));
5532
file_stack + (sizeof(file_stack)/sizeof(struct st_test_file)) - 1;
5533
cur_file= file_stack;
5545
5535
/* Init block stack */
5546
5536
memset(block_stack, 0, sizeof(block_stack));
5581
5571
internal::fn_format(buff, tmp.c_str(), "", "", MY_UNPACK_FILENAME);
5582
assert(cur_file == file_stack.data() && cur_file->file == 0);
5572
assert(cur_file == file_stack && cur_file->file == 0);
5583
5573
if (!(cur_file->file= fopen(buff, "r")))
5585
5575
fprintf(stderr, _("Could not open '%s' for reading: errno = %d"), buff, errno);
6163
6151
start= buff= (char *)malloc(strlen(from)+1);
6166
6155
uint32_t column_number;
6168
char *to= get_string(&buff, &from, command);
6157
to= get_string(&buff, &from, command);
6169
6158
if (!(column_number= atoi(to)) || column_number > MAX_COLUMNS)
6170
6159
die("Wrong column number to replace_column in '%s'", command->query);
6208
6201
} POINTER_ARRAY;
6210
6203
struct st_replace;
6211
struct st_replace *init_replace(const char **from, const char **to, uint32_t count,
6212
char *word_end_chars);
6204
struct st_replace *init_replace(char * *from, char * *to, uint32_t count,
6205
char * word_end_chars);
6213
6206
int insert_pointer_name(POINTER_ARRAY *pa,char * name);
6214
6207
void replace_strings_append(struct st_replace *rep, string* ds,
6215
6208
const char *from, int len);
6209
void free_pointer_array(POINTER_ARRAY *pa);
6217
st_replace *glob_replace= NULL;
6218
// boost::scoped_ptr<st_replace> glob_replace;
6211
struct st_replace *glob_replace= NULL;
6221
6214
Get arguments for replace. The syntax is:
6266
6249
if (my_isspace(charset_info,i))
6268
6251
*pos=0; /* End pointer */
6269
if (!(glob_replace= init_replace(from_array.typelib.type_names,
6270
to_array.typelib.type_names,
6271
from_array.typelib.count,
6252
if (!(glob_replace= init_replace((char**) from_array.typelib.type_names,
6253
(char**) to_array.typelib.type_names,
6254
(uint32_t) from_array.typelib.count,
6272
6255
word_end_chars)))
6273
6256
die("Can't initialize replace from '%s'", command->query);
6274
6257
free_pointer_array(&from_array);
6369
6355
st_regex substitution. At the end of substitutions buf points to the
6370
6356
one containing the final result.
6372
typedef vector<st_regex> regex_arr_t;
6375
6359
char* even_buf;
6377
6361
int even_buf_len;
6378
6362
int odd_buf_len;
6379
boost::array<char, 8 << 10> buf0_;
6380
boost::array<char, 8 << 10> buf1_;
6381
regex_arr_t regex_arr;
6384
boost::scoped_ptr<st_replace_regex> glob_replace_regex;
6365
struct st_replace_regex *glob_replace_regex= 0;
6386
6367
int reg_replace(char** buf_p, int* buf_len_p, char *pattern, char *replace,
6387
6368
char *string, int icase, int global);
6423
6404
Returns: st_replace_regex struct with pairs of substitutions
6426
st_replace_regex::st_replace_regex(char* expr)
6407
static struct st_replace_regex* init_replace_regex(char* expr)
6409
struct st_replace_regex* res;
6410
char* buf,*expr_end;
6428
6413
uint32_t expr_len= strlen(expr);
6429
6414
char last_c = 0;
6432
char* buf= new char[expr_len];
6433
char* expr_end= expr + expr_len;
6415
struct st_regex reg;
6417
res=(st_replace_regex*)malloc(sizeof(*res)+expr_len);
6420
my_init_dynamic_array(&res->regex_arr,sizeof(struct st_regex),128,128);
6422
buf= (char*)res + sizeof(*res);
6423
expr_end= expr + expr_len;
6437
6427
/* for each regexp substitution statement */
6438
6428
while (p < expr_end)
6490
regex_arr.push_back(reg);
6481
/* done parsing the statement, now place it in regex_arr */
6482
if (insert_dynamic(&res->regex_arr,(unsigned char*) ®))
6483
die("Out of memory");
6492
odd_buf_len= even_buf_len= buf0_.size();
6493
even_buf= buf0_.data();
6494
odd_buf= buf1_.data();
6485
res->odd_buf_len= res->even_buf_len= 8192;
6486
res->even_buf= (char*)malloc(res->even_buf_len);
6487
res->odd_buf= (char*)malloc(res->odd_buf_len);
6488
res->buf= res->even_buf;
6500
6494
die("Error parsing replace_regex \"%s\"", expr);
6522
int st_replace_regex::multi_reg_replace(char* val)
6517
static int multi_reg_replace(struct st_replace_regex* r,char* val)
6525
char* out_buf= even_buf;
6526
int* buf_len_p= &even_buf_len;
6520
char* in_buf, *out_buf;
6524
out_buf= r->even_buf;
6525
buf_len_p= &r->even_buf_len;
6529
6528
/* For each substitution, do the replace */
6530
BOOST_FOREACH(regex_arr_t::const_reference i, regex_arr)
6529
for (i= 0; i < r->regex_arr.elements; i++)
6532
6532
char* save_out_buf= out_buf;
6533
if (!reg_replace(&out_buf, buf_len_p, i.pattern, i.replace,
6534
in_buf, i.icase, i.global))
6534
get_dynamic(&r->regex_arr,(unsigned char*)&re,i);
6536
if (!reg_replace(&out_buf, buf_len_p, re.pattern, re.replace,
6537
in_buf, re.icase, re.global))
6536
6539
/* if the buffer has been reallocated, make adjustments */
6537
6540
if (save_out_buf != out_buf)
6539
if (save_out_buf == even_buf)
6542
if (save_out_buf == r->even_buf)
6543
r->even_buf= out_buf;
6545
r->odd_buf= out_buf;
6545
6549
if (in_buf == val)
6547
std::swap(in_buf, out_buf);
6548
buf_len_p= (out_buf == even_buf) ? &even_buf_len : &odd_buf_len;
6552
std::swap(in_buf,out_buf);
6554
buf_len_p= (out_buf == r->even_buf) ? &r->even_buf_len :
6559
return (r->buf == 0);
6563
6571
void do_get_replace_regex(struct st_command *command)
6565
6573
char *expr= command->first_argument;
6566
glob_replace_regex.reset(new st_replace_regex(expr));
6574
free_replace_regex();
6575
if (!(glob_replace_regex=init_replace_regex(expr)))
6576
die("Could not init replace_regex");
6567
6577
command->last_argument= command->end;
6580
void free_replace_regex()
6582
if (glob_replace_regex)
6584
delete_dynamic(&glob_replace_regex->regex_arr);
6585
free(glob_replace_regex->even_buf);
6586
free(glob_replace_regex->odd_buf);
6587
free(glob_replace_regex);
6588
glob_replace_regex=0;
6571
6595
Performs a regex substitution
6673
6697
/* NOTE(review): presumably the allocation increment (in sets) used when the
   REP_SETS buffers grow; its use is not visible in this part of the file,
   so confirm against init_sets()/make_new_set(). */
#define SET_MALLOC_HUNC 64
6674
6698
/* Number of symbol codes handled by the replace state machine; it sizes
   REP_SET::next[] and the used_chars[] table in init_replace(). Codes
   256, 257 and 258 are used there as SPACE_CHAR, START_OF_LINE and
   END_OF_LINE. */
#define LAST_CHAR_CODE 259
6679
void internal_set_bit(uint32_t bit);
6680
void internal_clear_bit(uint32_t bit);
6681
void or_bits(const REP_SET *from);
6682
void copy_bits(const REP_SET *from);
6683
int cmp_bits(const REP_SET *set2) const;
6684
int get_next_bit(uint32_t lastpos) const;
6700
typedef struct st_rep_set {
6686
6701
uint32_t *bits; /* Pointer to used sets */
6687
6702
short next[LAST_CHAR_CODE]; /* Pointer to next sets */
6688
6703
uint32_t found_len; /* Best match to date */
6689
6704
int found_offset;
6690
6705
uint32_t table_offset;
6691
6706
uint32_t size_of_bits; /* For convinience */
6697
int find_set(const REP_SET *find);
6698
void free_last_set();
6700
void make_sets_invisible();
6709
typedef struct st_rep_sets {
6702
6710
uint32_t count; /* Number of sets */
6703
6711
uint32_t extra; /* Extra sets in buffer */
6704
uint32_t invisible; /* Sets not shown */
6712
uint32_t invisible; /* Sets not chown */
6705
6713
uint32_t size_of_bits;
6706
6714
REP_SET *set,*set_buffer;
6707
6715
uint32_t *bit_buffer;
6718
typedef struct st_found_set {
6712
6719
uint32_t table_offset;
6713
6720
int found_offset;
6723
typedef struct st_follow {
6719
6725
uint32_t table_offset;
6723
int init_sets(REP_SETS *sets, uint32_t states);
6730
int init_sets(REP_SETS *sets,uint32_t states);
6724
6731
REP_SET *make_new_set(REP_SETS *sets);
6725
int find_found(FOUND_SET *found_set, uint32_t table_offset, int found_offset);
6727
static uint32_t found_sets= 0;
6729
static uint32_t replace_len(const char *str)
6732
void make_sets_invisible(REP_SETS *sets);
6733
void free_last_set(REP_SETS *sets);
6734
void free_sets(REP_SETS *sets);
6735
void internal_set_bit(REP_SET *set, uint32_t bit);
6736
void internal_clear_bit(REP_SET *set, uint32_t bit);
6737
void or_bits(REP_SET *to,REP_SET *from);
6738
void copy_bits(REP_SET *to,REP_SET *from);
6739
int cmp_bits(REP_SET *set1,REP_SET *set2);
6740
int get_next_bit(REP_SET *set,uint32_t lastpos);
6741
int find_set(REP_SETS *sets,REP_SET *find);
6742
int find_found(FOUND_SET *found_set,uint32_t table_offset,
6744
uint32_t start_at_word(char * pos);
6745
uint32_t end_of_word(char * pos);
6747
static uint32_t found_sets=0;
6750
static uint32_t replace_len(char * str)
6731
6752
uint32_t len=0;
6742
/* Return 1 if regexp starts with \b or ends with \b*/
6744
static bool start_at_word(const char *pos)
6746
return ((!memcmp(pos, "\\b",2) && pos[2]) || !memcmp(pos, "\\^", 2));
6749
static bool end_of_word(const char *pos)
6751
const char *end= strchr(pos, '\0');
6752
return (end > pos+2 && !memcmp(end-2, "\\b", 2)) || (end >= pos+2 && !memcmp(end-2, "\\$",2));
6755
6763
/* Init a replace structure for further calls */
6757
REPLACE *init_replace(const char **from, const char **to, uint32_t count, char *word_end_chars)
6765
REPLACE *init_replace(char * *from, char * *to,uint32_t count,
6766
char * word_end_chars)
6759
const int SPACE_CHAR= 256;
6760
const int START_OF_LINE= 257;
6761
const int END_OF_LINE= 258;
6768
static const int SPACE_CHAR= 256;
6769
static const int START_OF_LINE= 257;
6770
static const int END_OF_LINE= 258;
6763
6772
uint32_t i,j,states,set_nr,len,result_len,max_length,found_end,bits_set,bit_nr;
6764
6773
int used_sets,chr,default_state;
6765
6774
char used_chars[LAST_CHAR_CODE],is_word_end[256];
6766
char *to_pos, **to_array;
6775
char * pos, *to_pos, **to_array;
6777
REP_SET *set,*start_states,*word_states,*new_set;
6778
FOLLOWS *follow,*follow_ptr;
6780
FOUND_SET *found_set;
6781
REPLACE_STRING *rep_str;
6768
6784
/* Count number of states */
6769
6785
for (i=result_len=max_length=0 , states=2 ; i < count ; i++)
6783
6799
for (i=0 ; word_end_chars[i] ; i++)
6784
6800
is_word_end[(unsigned char) word_end_chars[i]]=1;
6787
REP_SET *set,*start_states,*word_states,*new_set;
6788
REPLACE_STRING *rep_str;
6789
if (init_sets(&sets, states))
6802
if (init_sets(&sets,states))
6792
vector<FOUND_SET> found_set(max_length * count);
6805
if (!(found_set= (FOUND_SET*) malloc(sizeof(FOUND_SET)*max_length*count)))
6793
6811
make_new_set(&sets); /* Set starting set */
6794
sets.make_sets_invisible(); /* Hide previus sets */
6812
make_sets_invisible(&sets); /* Hide previus sets */
6796
6814
word_states=make_new_set(&sets); /* Start of new word */
6797
6815
start_states=make_new_set(&sets); /* This is first state */
6798
vector<FOLLOWS> follow(states + 2);
6799
FOLLOWS *follow_ptr= &follow[1];
6816
if (!(follow=(FOLLOWS*) malloc((states+2)*sizeof(FOLLOWS))))
6800
6823
/* Init follow_ptr[] */
6801
for (i=0, states=1; i < count; i++)
6824
for (i=0, states=1, follow_ptr=follow+1 ; i < count ; i++)
6803
6826
if (from[i][0] == '\\' && from[i][1] == '^')
6805
start_states->internal_set_bit(states + 1);
6828
internal_set_bit(start_states,states+1);
6806
6829
if (!from[i][2])
6808
6831
start_states->table_offset=i;
6812
6835
else if (from[i][0] == '\\' && from[i][1] == '$')
6814
start_states->internal_set_bit(states);
6815
word_states->internal_set_bit(states);
6837
internal_set_bit(start_states,states);
6838
internal_set_bit(word_states,states);
6816
6839
if (!from[i][2] && start_states->table_offset == UINT32_MAX)
6818
6841
start_states->table_offset=i;
6824
word_states->internal_set_bit(states);
6847
internal_set_bit(word_states,states);
6825
6848
if (from[i][0] == '\\' && (from[i][1] == 'b' && from[i][2]))
6826
start_states->internal_set_bit(states + 1);
6849
internal_set_bit(start_states,states+1);
6828
start_states->internal_set_bit(states);
6851
internal_set_bit(start_states,states);
6831
for (pos= from[i], len=0; *pos ; pos++)
6853
for (pos=from[i], len=0; *pos ; pos++)
6833
6855
if (*pos == '\\' && *(pos+1))
6874
for (set_nr=0; set_nr < sets.count ; set_nr++)
6896
for (set_nr=0,pos=0 ; set_nr < sets.count ; set_nr++)
6876
6898
set=sets.set+set_nr;
6877
6899
default_state= 0; /* Start from beginning */
6879
6901
/* If end of found-string not found or start-set with current set */
6881
for (i= UINT32_MAX; (i= set->get_next_bit(i)) ;)
6903
for (i= UINT32_MAX; (i=get_next_bit(set,i)) ;)
6883
if (!follow[i].chr && !default_state)
6884
default_state= find_found(&found_set.front(), set->table_offset, set->found_offset+1);
6907
if (! default_state)
6908
default_state= find_found(found_set,set->table_offset,
6909
set->found_offset+1);
6886
sets.set[used_sets].copy_bits(set); /* Save set for changes */
6912
copy_bits(sets.set+used_sets,set); /* Save set for changes */
6887
6913
if (!default_state)
6888
sets.set[used_sets].or_bits(sets.set); /* Can restart from start */
6914
or_bits(sets.set+used_sets,sets.set); /* Can restart from start */
6890
6916
/* Find all chars that follow current sets */
6891
6917
memset(used_chars, 0, sizeof(used_chars));
6892
for (i= UINT32_MAX; (i= sets.set[used_sets].get_next_bit(i)) ;)
6918
for (i= UINT32_MAX; (i=get_next_bit(sets.set+used_sets,i)) ;)
6894
6920
used_chars[follow[i].chr]=1;
6895
6921
if ((follow[i].chr == SPACE_CHAR && !follow[i+1].chr &&
6928
6954
follow[i].len > found_end)
6929
6955
found_end=follow[i].len;
6930
6956
if (chr && follow[i].chr)
6931
new_set->internal_set_bit(i + 1); /* To next set */
6957
internal_set_bit(new_set,i+1); /* To next set */
6933
new_set->internal_set_bit(i);
6959
internal_set_bit(new_set,i);
6938
6964
new_set->found_len=0; /* Set for testing if first */
6940
for (i= UINT32_MAX; (i= new_set->get_next_bit(i)) ;)
6966
for (i= UINT32_MAX; (i=get_next_bit(new_set,i)) ;)
6942
6968
if ((follow[i].chr == SPACE_CHAR ||
6943
6969
follow[i].chr == END_OF_LINE) && ! chr)
6964
6990
if (bits_set == 1)
6966
set->next[chr] = find_found(&found_set.front(), new_set->table_offset, new_set->found_offset);
6967
sets.free_last_set();
6992
set->next[chr] = find_found(found_set,
6993
new_set->table_offset,
6994
new_set->found_offset);
6995
free_last_set(&sets);
6970
set->next[chr] = sets.find_set(new_set);
6998
set->next[chr] = find_set(&sets,new_set);
6973
set->next[chr] = sets.find_set(new_set);
7001
set->next[chr] = find_set(&sets,new_set);
6978
7006
/* Alloc replace structure for the replace-state-machine */
6980
REPLACE *replace= (REPLACE*)malloc(sizeof(REPLACE) * (sets.count)
6981
+ sizeof(REPLACE_STRING) * (found_sets + 1) + sizeof(char*) * count + result_len);
7008
if ((replace=(REPLACE*) malloc(sizeof(REPLACE)*(sets.count)+
7009
sizeof(REPLACE_STRING)*(found_sets+1)+
7010
sizeof(char *)*count+result_len)))
6984
7012
memset(replace, 0, sizeof(REPLACE)*(sets.count)+
6985
7013
sizeof(REPLACE_STRING)*(found_sets+1)+
6996
7024
rep_str[0].replace_string=0;
6997
7025
for (i=1 ; i <= found_sets ; i++)
6999
const char *pos= from[found_set[i-1].table_offset];
7027
pos=from[found_set[i-1].table_offset];
7000
7028
rep_str[i].found= !memcmp(pos, "\\^", 3) ? 2 : 1;
7001
rep_str[i].replace_string= to_array[found_set[i-1].table_offset];
7002
rep_str[i].to_offset= found_set[i-1].found_offset-start_at_word(pos);
7003
rep_str[i].from_offset= found_set[i-1].found_offset-replace_len(pos) + end_of_word(pos);
7029
rep_str[i].replace_string=to_array[found_set[i-1].table_offset];
7030
rep_str[i].to_offset=found_set[i-1].found_offset-start_at_word(pos);
7031
rep_str[i].from_offset=found_set[i-1].found_offset-replace_len(pos)+
7005
7034
for (i=0 ; i < sets.count ; i++)
7075
7106
return make_new_set(sets);
7078
void REP_SETS::free_last_set()
7084
void REP_SETS::free_sets()
7090
void REP_SET::internal_set_bit(uint32_t bit)
7092
bits[bit / WORD_BIT] |= 1 << (bit % WORD_BIT);
7095
void REP_SET::internal_clear_bit(uint32_t bit)
7097
bits[bit / WORD_BIT] &= ~ (1 << (bit % WORD_BIT));
7101
void REP_SET::or_bits(const REP_SET *from)
7103
for (uint32_t i= 0 ; i < size_of_bits; i++)
7104
bits[i]|=from->bits[i];
7107
void REP_SET::copy_bits(const REP_SET *from)
7109
memcpy(bits, from->bits, sizeof(uint32_t) * size_of_bits);
7112
int REP_SET::cmp_bits(const REP_SET *set2) const
7114
return memcmp(bits, set2->bits, sizeof(uint32_t) * size_of_bits);
7109
void free_last_set(REP_SETS *sets)
7116
void free_sets(REP_SETS *sets)
7118
free(sets->set_buffer);
7119
free(sets->bit_buffer);
7123
void internal_set_bit(REP_SET *set, uint32_t bit)
7125
set->bits[bit / WORD_BIT] |= 1 << (bit % WORD_BIT);
7129
void internal_clear_bit(REP_SET *set, uint32_t bit)
7131
set->bits[bit / WORD_BIT] &= ~ (1 << (bit % WORD_BIT));
7136
void or_bits(REP_SET *to,REP_SET *from)
7138
register uint32_t i;
7139
for (i=0 ; i < to->size_of_bits ; i++)
7140
to->bits[i]|=from->bits[i];
7144
void copy_bits(REP_SET *to,REP_SET *from)
7146
memcpy(to->bits,from->bits,
7147
(size_t) (sizeof(uint32_t) * to->size_of_bits));
7150
int cmp_bits(REP_SET *set1,REP_SET *set2)
7152
return memcmp(set1->bits,set2->bits, sizeof(uint32_t) * set1->size_of_bits);
7117
7156
/* Get next set bit from set. */
7119
int REP_SET::get_next_bit(uint32_t lastpos) const
7158
int get_next_bit(REP_SET *set,uint32_t lastpos)
7121
uint32_t *start= bits + ((lastpos+1) / WORD_BIT);
7122
uint32_t *end= bits + size_of_bits;
7123
uint32_t bits0= start[0] & ~((1 << ((lastpos+1) % WORD_BIT)) -1);
7125
while (!bits0 && ++start < end)
7160
uint32_t pos,*start,*end,bits;
7162
start=set->bits+ ((lastpos+1) / WORD_BIT);
7163
end=set->bits + set->size_of_bits;
7164
bits=start[0] & ~((1 << ((lastpos+1) % WORD_BIT)) -1);
7166
while (! bits && ++start < end)
7129
uint32_t pos= (start - bits) * WORD_BIT;
7130
while (!(bits0 & 1))
7170
pos=(uint32_t) (start-set->bits)*WORD_BIT;
7171
while (! (bits & 1))
7139
7180
free given set, else put in given set in sets and return its
7142
int REP_SETS::find_set(const REP_SET *find)
7183
int find_set(REP_SETS *sets,REP_SET *find)
7145
for (; i < count - 1; i++)
7186
for (i=0 ; i < sets->count-1 ; i++)
7147
if (!set[i].cmp_bits(find))
7188
if (!cmp_bits(sets->set+i,find))
7190
free_last_set(sets);
7160
7201
set->next[] == -1 is reserved for end without replaces.
7163
int find_found(FOUND_SET *found_set, uint32_t table_offset, int found_offset)
7204
int find_found(FOUND_SET *found_set,uint32_t table_offset, int found_offset)
7166
for (; i < found_sets; i++)
7207
for (i=0 ; (uint32_t) i < found_sets ; i++)
7168
7208
if (found_set[i].table_offset == table_offset &&
7169
7209
found_set[i].found_offset == found_offset)
7172
found_set[i].table_offset= table_offset;
7173
found_set[i].found_offset= found_offset;
7211
found_set[i].table_offset=table_offset;
7212
found_set[i].found_offset=found_offset;
7175
return - i - 2; // return new postion
7214
return -i-2; /* return new postion */
7217
/* Return 1 if regexp starts with \b or ends with \b*/
7219
uint32_t start_at_word(char * pos)
7221
return (((!memcmp(pos, "\\b",2) && pos[2]) ||
7222
!memcmp(pos, "\\^", 2)) ? 1 : 0);
7225
uint32_t end_of_word(char * pos)
7227
char * end= strchr(pos, '\0');
7228
return ((end > pos+2 && !memcmp(end-2, "\\b", 2)) ||
7229
(end >= pos+2 && !memcmp(end-2, "\\$",2))) ? 1 : 0;
7178
7232
/****************************************************************************
7251
7305
} /* insert_pointer_name */
7308
/* free pointer array */
7310
void free_pointer_array(POINTER_ARRAY *pa)
7312
if (pa->typelib.count)
7314
pa->typelib.count=0;
7315
free((char*) pa->typelib.type_names);
7316
pa->typelib.type_names=0;
7319
} /* free_pointer_array */
7254
7322
/* Functions that use replace and replace_regex */
7256
7324
/* Append the string to ds, with optional replace */
7257
void replace_append_mem(string *ds, const char *val, int len)
7325
void replace_append_mem(string *ds,
7326
const char *val, int len)
7259
7328
char *v= strdup(val);
7261
if (glob_replace_regex && !glob_replace_regex->multi_reg_replace(v))
7330
if (glob_replace_regex)
7263
v= glob_replace_regex->buf_;
7333
if (!multi_reg_replace(glob_replace_regex, v))
7335
v= glob_replace_regex->buf;
7266
7340
if (glob_replace)
7268
7342
/* Normal replace */
7269
7343
replace_strings_append(glob_replace, ds, v, len);
7272
7347
ds->append(v, len);