1
/* -*- mode: c++; c-basic-offset: 2; indent-tabs-mode: nil; -*-
2
* vim:expandtab:shiftwidth=2:tabstop=2:smarttab:
4
* Copyright (C) 2008,2009 Sun Microsystems
6
* This program is free software; you can redistribute it and/or modify
7
* it under the terms of the GNU General Public License as published by
8
* the Free Software Foundation; version 2 of the License.
10
* This program is distributed in the hope that it will be useful,
11
* but WITHOUT ANY WARRANTY; without even the implied warranty of
12
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13
* GNU General Public License for more details.
15
* You should have received a copy of the GNU General Public License
16
* along with this program; if not, write to the Free Software
17
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
21
#include <drizzled/plugin/logging.h>
22
#include <drizzled/gettext.h>
23
#include <drizzled/session.h>
27
#include <sys/types.h>
32
using namespace drizzled;
34
/* TODO make this dynamic as needed */
35
// Size in bytes of the buffer that post() formats each log line into.
static const int MAX_MSG_LEN= 32*1024;
37
// Master switch: post() checks this and compares it against false first.
static bool sysvar_logging_query_enable= false;
38
// Path handed to open() when the Logging_query object is constructed;
// NULL means no destination file was configured.
static char* sysvar_logging_query_filename= NULL;
39
// Optional pattern handed to pcre_compile() at construction time.
static char* sysvar_logging_query_pcre= NULL;
40
/* TODO fix these to not be unsigned long once we have sensible sys_var system */
41
// Compared in post() against (now - session->start_utime).
static unsigned long sysvar_logging_query_threshold_slow= 0;
42
// Compared in post() against session->sent_row_count.
static unsigned long sysvar_logging_query_threshold_big_resultset= 0;
43
// Compared in post() against session->examined_row_count.
static unsigned long sysvar_logging_query_threshold_big_examined= 0;
45
/**
 * Return a timestamp in microseconds.
 *
 * Borrowed from mysys/my_getsystime; used until the Session can supply a
 * good microsecond "now" of its own.
 *
 * @return gethrtime()/1000 when HAVE_GETHRTIME is defined, otherwise the
 *         gettimeofday() time converted to microseconds.
 */
static uint64_t get_microtime(void)
{
#if defined(HAVE_GETHRTIME)
  return gethrtime()/1000;
#else
  struct timeval t;

  /* The following loop is here because gettimeofday may fail on some systems */
  while (gettimeofday(&t, NULL) != 0) {}

  /* widen before multiplying so the seconds part cannot overflow */
  return (uint64_t)t.tv_sec * 1000000 + (uint64_t)t.tv_usec;
#endif /* defined(HAVE_GETHRTIME) */
}
65
/**
 * Quote a string so it is safe to include in a CSV line.
 *
 * Commas, double quotes and backslashes are backslash-quoted, and the ASCII
 * unprintable characters are written either as a two-character escape
 * (\0 \a \b \t \n \v \f \r \e) or as \xHH. Bytes with the high bit set are
 * passed through unchanged, which keeps a UTF8 string intact.
 *
 * The output never overruns dst: conversion stops as soon as fewer than
 * 5 bytes remain (worst case for one source byte is backslash, x, two hex
 * digits and the terminating null), so a very long query is truncated
 * rather than overwriting memory.
 *
 * TODO consider remapping the unprintables instead to "Printable
 * Representation", the Unicode characters from the area U+2400 to
 * U+2421 reserved for representing control characters when it is
 * necessary to print or display them rather than have them perform
 * their intended function.
 *
 * @param src     bytes to quote (need not be null terminated)
 * @param srclen  number of bytes to read from src
 * @param dst     destination buffer
 * @param dstlen  size of dst in bytes
 * @return dst, null terminated whenever dst is non-NULL and dstlen > 0
 */
static unsigned char *quotify (const unsigned char *src, size_t srclen,
                               unsigned char *dst, size_t dstlen)
{
  static const char hexit[]= { '0', '1', '2', '3', '4', '5', '6', '7',
                               '8', '9', 'a', 'b', 'c', 'd', 'e', 'f' };
  size_t dst_ndx= 0;  /* ndx down the dst */
  size_t src_ndx;     /* ndx down the src */

  /* no room even for the terminator: leave dst untouched */
  if (dst == NULL || dstlen == 0)
    return dst;

  /* nothing readable: produce an empty string */
  if (src == NULL)
    srclen= 0;

  for (src_ndx= 0; src_ndx < srclen; src_ndx++)
  {
    const unsigned char c= src[src_ndx];
    unsigned char esc= 0;  /* second char of a two-char escape, 0 if none */

    /* Worst case, need 5 dst bytes for the next src byte.
       backslash x hexit hexit null
       so if not enough room, just terminate the string and return */
    if ((dstlen - dst_ndx) < 5)
      break;

    switch (c)
    {
    case 0x00: esc= (unsigned char) '0'; break;  /* null */
    case 0x07: esc= (unsigned char) 'a'; break;  /* bell */
    case 0x08: esc= (unsigned char) 'b'; break;  /* backspace */
    case 0x09: esc= (unsigned char) 't'; break;  /* horiz tab */
    case 0x0a: esc= (unsigned char) 'n'; break;  /* line feed */
    case 0x0b: esc= (unsigned char) 'v'; break;  /* vert tab */
    case 0x0c: esc= (unsigned char) 'f'; break;  /* formfeed */
    case 0x0d: esc= (unsigned char) 'r'; break;  /* carriage return */
    case 0x1b: esc= (unsigned char) 'e'; break;  /* escape */
    case 0x22:                                   /* quotation mark */
    case 0x2C:                                   /* comma */
    case 0x5C: esc= c; break;                    /* backslash */
    default: break;
    }

    if (esc != 0)
    {
      dst[dst_ndx++]= 0x5C;
      dst[dst_ndx++]= esc;
    }
    else if ((c < 0x20) || (c == 0x7F))
    {
      /* other unprintable ASCII */
      dst[dst_ndx++]= 0x5C;
      dst[dst_ndx++]= (unsigned char) 'x';
      dst[dst_ndx++]= (unsigned char) hexit[(c >> 4) & 0x0f];
      dst[dst_ndx++]= (unsigned char) hexit[c & 0x0f];
    }
    else
    {
      /* printable ASCII, and high bit bytes (non-ASCII UTF8) pass thru */
      dst[dst_ndx++]= c;
    }
  }

  /* the room check above always leaves at least one byte for this */
  dst[dst_ndx]= (unsigned char)0x00;
  return dst;
}
175
// Logging plugin that formats one CSV line per qualifying statement and
// writes it to the file named by sysvar_logging_query_filename.
class Logging_query: public drizzled::plugin::Logging
184
// Member-initialiser list: registers under the name "Logging_query" and
// starts with no open file (fd -1) and no compiled or studied regex.
: drizzled::plugin::Logging("Logging_query"),
185
fd(-1), re(NULL), pe(NULL)
188
/* if there is no destination filename, dont bother doing anything */
189
if (sysvar_logging_query_filename == NULL)
192
// Open the log write-only in append mode, creating the file if it is missing.
fd= open(sysvar_logging_query_filename,
193
O_WRONLY | O_APPEND | O_CREAT,
197
// Report the failed open() together with the filename that was tried.
errmsg_printf(ERRMSG_LVL_ERROR, _("fail open() fn=%s er=%s\n"),
198
sysvar_logging_query_filename,
203
// Optional filter: compile and study the configured pattern once, up front.
if (sysvar_logging_query_pcre != NULL)
205
const char *this_pcre_error;
206
int this_pcre_erroffset;
207
re= pcre_compile(sysvar_logging_query_pcre, 0, &this_pcre_error,
208
&this_pcre_erroffset, NULL);
209
// NOTE(review): re is handed to pcre_study without first checking whether
// pcre_compile succeeded; neither error string is reported.
pe= pcre_study(re, 0, &this_pcre_error);
210
/* TODO emit error messages if there is a problem */
233
// Hook taking a Session; the parameter is unnamed, so it is not used here.
virtual bool pre (Session *)
235
/* we could just not have a pre entrypoint at all,
236
and have logging_pre == NULL
237
but we have this here for the sake of being an example */
241
// Hook that decides whether the statement in `session` qualifies for logging
// and, if so, formats it as one CSV line and writes it to fd.
virtual bool post (Session *session)
243
// Whole log line is built on the stack (MAX_MSG_LEN bytes).
char msgbuf[MAX_MSG_LEN];
247
assert(session != NULL);
252
/* Yes, we know that checking sysvar_logging_query_enable,
253
sysvar_logging_query_threshold_big_resultset, and
254
sysvar_logging_query_threshold_big_examined is not threadsafe,
255
because some other thread might change these sysvars. But we
256
don't care. We might start logging a little late as it spreads
257
to other threads. Big deal. */
259
// return if not enabled or query was too fast or resultset was too small
260
if (sysvar_logging_query_enable == false)
262
if (session->sent_row_count < sysvar_logging_query_threshold_big_resultset)
264
if (session->examined_row_count < sysvar_logging_query_threshold_big_examined)
267
/* TODO, the session object should have a "utime command completed"
268
inside itself, so be more accurate, and so this doesnt have to
269
keep calling current_utime, which can be slow */
271
// One timestamp is taken here and reused for every elapsed-time column below.
uint64_t t_mark= get_microtime();
273
// Elapsed time since session->start_utime, checked against the slow threshold.
if ((t_mark - session->start_utime) < (sysvar_logging_query_threshold_slow))
279
// Run the compiled/studied pattern over the query text; no capture vector is
// requested (NULL, 0).
this_pcre_rc = pcre_exec(re, pe, session->query.c_str(), session->query.length(), 0, 0, NULL, 0);
280
// NOTE(review): per the PCRE docs a negative result means no match or an
// error; the action taken on it is not visible here.
if (this_pcre_rc < 0)
284
// buffer to quotify the query
285
// quotify() stops once fewer than 5 bytes remain in its destination, so the
// quoted query is cut short to fit these 255 bytes.
unsigned char qs[255];
287
// to avoid trying to printf %s something that is potentially NULL
288
const char *dbs= session->db.empty() ? "" : session->db.c_str();
291
// NOTE(review): snprintf reports the untruncated length, which can be
// >= MAX_MSG_LEN; confirm the length later passed to write() is clamped.
snprintf(msgbuf, MAX_MSG_LEN,
292
"%"PRIu64",%"PRIu64",%"PRIu64",\"%.*s\",\"%s\",\"%.*s\","
293
"%"PRIu64",%"PRIu64",%"PRIu64",%"PRIu64",%"PRIu64","
294
"%"PRIu32",%"PRIu32",%"PRIu32",\"%s\"\n",
297
session->getQueryId(),
298
// dont need to quote the db name, always CSV safe
299
(int)session->db.length(), dbs,
300
// do need to quote the query
301
quotify((unsigned char *)session->getQueryString().c_str(),
302
session->getQueryLength(), qs, sizeof(qs)),
303
// command_name is defined in drizzled/sql_parse.cc
304
// dont need to quote the command name, always CSV safe
305
(int)command_name[session->command].length,
306
command_name[session->command].str,
307
// counters are at end, to make it easier to add more
308
// the three differences below are all measured back from t_mark
(t_mark - session->getConnectMicroseconds()),
309
(t_mark - session->start_utime),
310
(t_mark - session->utime_after_lock),
311
session->sent_row_count,
312
session->examined_row_count,
314
session->total_warn_count,
315
session->getServerId(),
319
// a single write has a kernel thread lock, thus no need mutex guard this
320
wrv= write(fd, msgbuf, msgbuf_len);
321
// The whole line is expected to go out in one write(); a short or failed
// write trips this assert (only when asserts are compiled in).
assert(wrv == msgbuf_len);
327
static Logging_query *handler= NULL;
329
static int logging_query_plugin_init(drizzled::plugin::Registry ®istry)
331
handler= new Logging_query();
332
registry.add(handler);
337
static int logging_query_plugin_deinit(drizzled::plugin::Registry ®istry)
339
registry.remove(handler);
345
// Boolean system variable backed by sysvar_logging_query_enable; defaults to
// false, with no check or update callbacks.
static DRIZZLE_SYSVAR_BOOL(
347
sysvar_logging_query_enable,
349
N_("Enable logging to CSV file"),
350
NULL, /* check func */
351
NULL, /* update func */
352
false /* default */);
354
// String system variable backed by sysvar_logging_query_filename (the log
// file path); no check or update callbacks.
static DRIZZLE_SYSVAR_STR(
356
sysvar_logging_query_filename,
358
N_("File to log to"),
359
NULL, /* check func */
360
NULL, /* update func*/
363
// String system variable backed by sysvar_logging_query_pcre (the pattern
// queries are matched against); no check or update callbacks.
static DRIZZLE_SYSVAR_STR(
365
sysvar_logging_query_pcre,
367
N_("PCRE to match the query against"),
368
NULL, /* check func */
369
NULL, /* update func*/
372
// Unsigned long system variable backed by sysvar_logging_query_threshold_slow;
// value is in microseconds and capped at UINT32_MAX.
static DRIZZLE_SYSVAR_ULONG(
374
sysvar_logging_query_threshold_slow,
376
N_("Threshold for logging slow queries, in microseconds"),
377
NULL, /* check func */
378
NULL, /* update func */
381
UINT32_MAX, /* max */
384
// Unsigned long system variable "threshold_big_resultset", backed by
// sysvar_logging_query_threshold_big_resultset; counts rows returned and is
// capped at UINT32_MAX.
static DRIZZLE_SYSVAR_ULONG(
385
threshold_big_resultset,
386
sysvar_logging_query_threshold_big_resultset,
388
N_("Threshold for logging big queries, for rows returned"),
389
NULL, /* check func */
390
NULL, /* update func */
393
UINT32_MAX, /* max */
396
// Unsigned long system variable "threshold_big_examined", backed by
// sysvar_logging_query_threshold_big_examined; counts rows examined and is
// capped at UINT32_MAX.
static DRIZZLE_SYSVAR_ULONG(
397
threshold_big_examined,
398
sysvar_logging_query_threshold_big_examined,
400
N_("Threshold for logging big queries, for rows examined"),
401
NULL, /* check func */
402
NULL, /* update func */
405
UINT32_MAX, /* max */
408
// Table of this plugin's six system variables; it is the
// logging_query_system_variables entry in the plugin declaration.
static drizzle_sys_var* logging_query_system_variables[]= {
409
DRIZZLE_SYSVAR(enable),
410
DRIZZLE_SYSVAR(filename),
411
DRIZZLE_SYSVAR(pcre),
412
DRIZZLE_SYSVAR(threshold_slow),
413
DRIZZLE_SYSVAR(threshold_big_resultset),
414
DRIZZLE_SYSVAR(threshold_big_examined),
418
// Plugin declaration: names the author and description and wires up the
// init/deinit hooks and the system variable table defined in this file.
DRIZZLE_DECLARE_PLUGIN
423
"Mark Atwood <mark@fallenpegasus.com>",
424
N_("Log queries to a CSV file"),
426
logging_query_plugin_init,
427
logging_query_plugin_deinit,
428
logging_query_system_variables,
431
DRIZZLE_DECLARE_PLUGIN_END;