-
Notifications
You must be signed in to change notification settings - Fork 4k
/
Copy pathregular_expressions.cc
263 lines (227 loc) · 10 KB
/
regular_expressions.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
/* Copyright (c) 2019, 2025, Oracle and/or its affiliates.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License, version 2.0,
as published by the Free Software Foundation.
This program is designed to work with certain software (including
but not limited to OpenSSL) that is licensed under separate terms,
as designated in a particular file or component or in included license
documentation. The authors of MySQL hereby grant you an additional
permission to link the program and your derivative works with the
separately licensed software that they have either included with
the program or referenced in the documentation.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License, version 2.0, for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
#include "client/mysqltest/regular_expressions.h"
#include "my_compiler.h"
#include "mysql/strings/m_ctype.h"
/*
  Error reporter used by the functions in this file. It does not return to
  the caller ([[noreturn]]); its arguments follow printf conventions and are
  checked as such by the compiler through the format attribute.
*/
[[noreturn]] extern void die(const char *fmt, ...)
MY_ATTRIBUTE((format(printf, 1, 2)));
/*
Filter for queries that can be run using the
MySQL Prepared Statements C API.

The pattern is a single alternation anchored at the start of the statement.
Every alternative allows optional leading whitespace, then one or more
keywords separated by whitespace, and requires one whitespace character
after the last keyword. It is compiled case-insensitively into ps_re.

The pattern itself does not reject statements containing ';'; that check
is done separately in search_protocol_re().
*/
static const char *const ps_re_str =
"^("
"[[:space:]]*REPLACE[[:space:]]|"
"[[:space:]]*INSERT[[:space:]]|"
"[[:space:]]*UPDATE[[:space:]]|"
"[[:space:]]*DELETE[[:space:]]|"
"[[:space:]]*SELECT[[:space:]]|"
"[[:space:]]*CREATE[[:space:]]+DATABASE[[:space:]]|"
"[[:space:]]*CREATE[[:space:]]+INDEX[[:space:]]|"
"[[:space:]]*CREATE[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*CREATE[[:space:]]+USER[[:space:]]|"
"[[:space:]]*CREATE[[:space:]]+TEMPORARY[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*DROP[[:space:]]+DATABASE[[:space:]]|"
"[[:space:]]*DROP[[:space:]]+INDEX[[:space:]]|"
"[[:space:]]*DROP[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*DROP[[:space:]]+USER[[:space:]]|"
"[[:space:]]*DROP[[:space:]]+VIEW[[:space:]]|"
"[[:space:]]*DROP[[:space:]]+TEMPORARY[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*ALTER[[:space:]]+USER[[:space:]]|"
"[[:space:]]*RENAME[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*RENAME[[:space:]]+USER[[:space:]]|"
"[[:space:]]*TRUNCATE[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*ANALYZE[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*CHECKSUM[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*CHECKSUM[[:space:]]+TABLES[[:space:]]|"
"[[:space:]]*OPTIMIZE[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*REPAIR[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*GRANT[[:space:]]|"
"[[:space:]]*KILL[[:space:]]|"
"[[:space:]]*REVOKE[[:space:]]+ALL[[:space:]]+PRIVILEGES[[:space:]]|"
"[[:space:]]*DO[[:space:]]|"
"[[:space:]]*CALL[[:space:]]|"
"[[:space:]]*COMMIT[[:space:]]|"
"[[:space:]]*SET[[:space:]]+OPTION[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+CREATE[[:space:]]+TABLE[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+CREATE[[:space:]]+PROCEDURE[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+CREATE[[:space:]]+FUNCTION[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+CREATE[[:space:]]+VIEW[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+CREATE[[:space:]]+EVENT[[:space:]]|"
"[[:space:]]*INSTALL[[:space:]]+PLUGIN[[:space:]]|"
"[[:space:]]*UNINSTALL[[:space:]]+PLUGIN[[:space:]]|"
"[[:space:]]*RESET[[:space:]]+MASTER[[:space:]]|"
"[[:space:]]*RESET[[:space:]]+SLAVE[[:space:]]|"
"[[:space:]]*RESET[[:space:]]+QUERY[[:space:]]+CACHE[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+BINLOG[[:space:]]+EVENTS[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+MASTER[[:space:]]+LOGS[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+MASTER[[:space:]]+STATUS[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+BINARY[[:space:]]+LOGS[[:space:]]|"
"[[:space:]]*SHOW[[:space:]]+SLAVE[[:space:]]+STATUS[[:space:]]|"
"[[:space:]]*SLAVE[[:space:]]+START[[:space:]]|"
"[[:space:]]*SLAVE[[:space:]]+STOP[[:space:]]|"
"[[:space:]]*DELETE[[:space:]]+MULTI[[:space:]]|"
"[[:space:]]*UPDATE[[:space:]]+MULTI[[:space:]]|"
"[[:space:]]*INSERT[[:space:]]+SELECT[[:space:]])";
/*
Filter for queries that can be run using stored procedures.
It is the same pattern string as the prepared statement filter.
*/
static const char *const sp_re_str = ps_re_str;
/*
Filter for queries that can be run as views.
Matches statements that start with optional whitespace followed by
SELECT and one whitespace character.
*/
static const char *const view_re_str =
"^("
"[[:space:]]*SELECT[[:space:]])";
/*
Filter matching statements that start with optional whitespace followed by
INSERT, UPDATE, DELETE, EXPLAIN or SELECT and one whitespace character.
It is compiled into opt_trace_re.
NOTE(review): presumably selects the statements that are run with
optimizer trace enabled -- confirm against the callers of opt_trace_re.
*/
const char *const opt_trace_re_str =
"^("
"[[:space:]]*INSERT[[:space:]]|"
"[[:space:]]*UPDATE[[:space:]]|"
"[[:space:]]*DELETE[[:space:]]|"
"[[:space:]]*EXPLAIN[[:space:]]|"
"[[:space:]]*SELECT[[:space:]])";
/*
Filter for queries that can be converted to EXPLAIN.
Matches statements that start with optional whitespace followed by
SELECT, DELETE, UPDATE, INSERT or REPLACE and one whitespace character.
*/
static const char *const explain_re_str =
"^("
"[[:space:]]*(SELECT|DELETE|UPDATE|INSERT|REPLACE)[[:space:]])";
/*
  Precompiled regular expressions, one for each of the pattern strings
  ps_re_str, sp_re_str, view_re_str, opt_trace_re_str and explain_re_str.

  They all share the same options: case-insensitive matching (icase) and no
  recording of sub-expression matches (nosubs).
*/
static const std::regex_constants::syntax_option_type protocol_re_flags =
    std::regex_constants::nosubs | std::regex_constants::icase;

std::regex ps_re(ps_re_str, protocol_re_flags);
std::regex sp_re(sp_re_str, protocol_re_flags);
std::regex view_re(view_re_str, protocol_re_flags);
std::regex opt_trace_re(opt_trace_re_str, protocol_re_flags);
std::regex explain_re(explain_re_str, protocol_re_flags);
/*
  Character set handed to my_isspace() when search_protocol_re() skips
  leading whitespace. Only declared here.
*/
extern CHARSET_INFO *charset_info;
/**
  Execute all substitutions on val.

  The regular expressions in r->regex_arr are applied in order. Whenever one
  of them changes the text, the result is stored in one of the two scratch
  buffers (r->even_buf / r->odd_buf) and becomes the input of the next
  expression; the two buffers alternate as output so that the current input
  is never overwritten. The memory val points at is only read.

  @param[in,out] r    Pointer to the st_replace_regex structure which
                      holds arguments and information for the command.
  @param[in]     val  Pointer to the character string to be used as
                      input for the regex replace operation.
  @param[in,out] len  Pointer to variable holding length of input string.
                      Updated to the length of the result whenever a
                      substitution changes the text.

  @retval 0  At least one substitution was made; r->buf points at the result.
  @retval 1  No substitution was made; r->buf is nullptr.

  @note
    r->buf points at the resulting buffer with all substitutions done.
    len points at length of resulting buffer.
    r->even_buf and r->odd_buf might have been reallocated.
    r->even_buf_len and r->odd_buf_len might have been changed.
    An invalid regular expression is reported through die(), which does
    not return.

  @todo
    At some point figure out if there is a way to do everything in one pass.
*/
int multi_reg_replace(struct st_replace_regex *r, char *val, size_t *len) {
  char *in_buf = val;
  char *out_buf = r->even_buf;
  int *buf_len_p = &r->even_buf_len;

  r->buf = nullptr;

  /* Nothing is attempted when the input buffer is empty on entry. */
  if (*len > 0) {
    for (size_t i = 0; i < r->regex_arr.size(); i++) {
      try {
        struct st_regex const re(r->regex_arr[i]);
        char *save_out_buf = out_buf;

        std::regex const rpat(re.pattern,
                              (re.icase == 0)
                                  ? std::regex_constants::ECMAScript
                                  : std::regex_constants::icase);

        std::string sin = std::string(in_buf, *len);
        std::string sout;

        /*
          We use iterators instead of using the input buffer directly as
          it may include the null character (0x00) and characters succeeding
          them will be ignored unless we specify the start and end positions
          of the input string explicitly.
        */
        std::regex_replace(std::back_inserter(sout), sin.begin(), sin.end(),
                           rpat, re.replace, std::regex_constants::format_sed);

        /*
          If some replacement is performed, write the replaced string into the
          output buffer.
        */
        if (sout != sin) {
          *len = sout.length();

          /* Grow the output buffer so it holds the result plus a NUL. */
          if (*len >= (uint)*buf_len_p) {
            uint const need_buf_len = (*len) + 1;
            out_buf = (char *)my_realloc(PSI_NOT_INSTRUMENTED, out_buf,
                                         need_buf_len, MYF(MY_WME + MY_FAE));
            *buf_len_p = need_buf_len;
          }

          /*
            Copy the result including its terminating NUL. memcpy is used
            rather than strncpy because the result may contain embedded
            NUL bytes; strncpy would stop at the first one and zero-fill
            the remainder, silently dropping the rest of the data.
          */
          memcpy(out_buf, sout.c_str(), *len + 1);

          // If the buffer has been reallocated, make adjustments
          if (save_out_buf != out_buf) {
            if (save_out_buf == r->even_buf)
              r->even_buf = out_buf;
            else
              r->odd_buf = out_buf;
          }

          r->buf = out_buf;

          /*
            The buffer just written becomes the next input and the other
            scratch buffer becomes the next output. On the first
            substitution the input is still val, so switch to odd_buf first.
          */
          if (in_buf == val) in_buf = r->odd_buf;
          std::swap(in_buf, out_buf);

          buf_len_p =
              (out_buf == r->even_buf) ? &r->even_buf_len : &r->odd_buf_len;
        }
      } catch (const std::regex_error &e) {
        die("Error in replace_regex for `/%s/%s/` : %s",
            (r->regex_arr[i]).pattern, (r->regex_arr[i]).replace, e.what());
      }
    }
  }

  return (r->buf == nullptr);
}
/**
  Function to check if a protocol's regular expression matches the query
  string.

  Leading whitespace is skipped, followed by at most one leading
  C-style comment, before the pattern is tried. The pattern must match
  at the very start of what remains (match_continuous). An unterminated
  leading comment is reported through die(), which does not return.

  @param re   Pointer to a precompiled regular expression.
  @param str  Pointer to character string in which the pattern needs to be
              searched.

  @retval 1  If the pattern is found.
  @retval 0  If the pattern is not found, or if re is ps_re or sp_re and
             the remaining statement text contains a ';'.
*/
int search_protocol_re(std::regex *re, const char *str) {
  while (my_isspace(charset_info, *str)) str++;

  if (str[0] == '/' && str[1] == '*') {
    /*
      Look for the terminator after the two-character opener. Searching
      from str itself would let the '*' of the opener pair with a directly
      following '/', so that the text "/" "*" "/" is mistaken for a
      complete comment.
    */
    const char *comm_end = strstr(str + 2, "*/");
    if (!comm_end) die("Statement is unterminated comment");
    str = comm_end + 2;
  }

  // Check if statement matches the pattern string
  if (!std::regex_search(str, *re, std::regex_constants::match_continuous))
    return 0;

  /*
    Simulate the "[^;]*$" check which follows the SQL prefix
    in the regex used to filter statements to be run with ps/
    sp protocol as using it directly in the regex is currently
    not possible due to an issue in the standard regex library.
  */
  if ((re == &ps_re || re == &sp_re) && strchr(str, ';') != nullptr) return 0;

  // Match found
  return 1;
}