~drizzle-trunk/drizzle/development

641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1
/*****************************************************************************
2
3
Copyright (c) 1995, 2009, Innobase Oy. All Rights Reserved.
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
4
Copyright (c) 2008, 2009 Google Inc.
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
5
6
Portions of this file contain modifications contributed and copyrighted by
7
Google, Inc. Those modifications are gratefully acknowledged and are described
8
briefly in the InnoDB documentation. The contributions by Google are
9
incorporated with their permission, and subject to the conditions contained in
10
the file COPYING.Google.
11
12
This program is free software; you can redistribute it and/or modify it under
13
the terms of the GNU General Public License as published by the Free Software
14
Foundation; version 2 of the License.
15
16
This program is distributed in the hope that it will be useful, but WITHOUT
17
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
18
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
19
20
You should have received a copy of the GNU General Public License along with
1802.10.2 by Monty Taylor
Update all of the copyright headers to include the correct address.
21
this program; if not, write to the Free Software Foundation, Inc., 51 Franklin
22
St, Fifth Floor, Boston, MA 02110-1301 USA
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
23
24
*****************************************************************************/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
25
/***********************************************************************
26
27
Copyright (c) 1995, 2009, Innobase Oy. All Rights Reserved.
28
Copyright (c) 2009, Percona Inc.
29
30
Portions of this file contain modifications contributed and copyrighted
31
by Percona Inc.. Those modifications are
32
gratefully acknowledged and are described briefly in the InnoDB
33
documentation. The contributions by Percona Inc. are incorporated with
34
their permission, and subject to the conditions contained in the file
35
COPYING.Percona.
36
37
This program is free software; you can redistribute it and/or modify it
38
under the terms of the GNU General Public License as published by the
39
Free Software Foundation; version 2 of the License.
40
41
This program is distributed in the hope that it will be useful, but
42
WITHOUT ANY WARRANTY; without even the implied warranty of
43
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
44
Public License for more details.
45
46
You should have received a copy of the GNU General Public License along
47
with this program; if not, write to the Free Software Foundation, Inc.,
1802.10.2 by Monty Taylor
Update all of the copyright headers to include the correct address.
48
51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
49
50
***********************************************************************/
51
52
/**************************************************//**
53
@file srv/srv0srv.c
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
54
The database server main program
55
56
NOTE: SQL Server 7 uses something which the documentation
57
calls user mode scheduled threads (UMS threads). One such
58
thread is usually allocated per processor. Win32
59
documentation does not know any UMS threads, which suggests
60
that the concept is internal to SQL Server 7. It may mean that
61
SQL Server 7 does all the scheduling of threads itself, even
62
in i/o waits. We should maybe modify InnoDB to use the same
63
technique, because thread switches within NT may be too slow.
64
65
SQL Server 7 also mentions fibers, which are cooperatively
66
scheduled threads. They can boost performance by 5 %,
67
according to the Delaney and Soukup's book.
68
69
Windows 2000 will have something called thread pooling
70
(see msdn website), which we could possibly use.
71
72
Another possibility could be to use some very fast user space
73
thread library. This might confuse NT though.
74
75
Created 10/8/1995 Heikki Tuuri
76
*******************************************************/
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
77
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
78
/* Dummy comment */
79
#include "srv0srv.h"
80
81
#include "ut0mem.h"
82
#include "ut0ut.h"
83
#include "os0proc.h"
84
#include "mem0mem.h"
85
#include "mem0pool.h"
86
#include "sync0sync.h"
87
#include "thr0loc.h"
88
#include "que0que.h"
89
#include "srv0que.h"
90
#include "log0recv.h"
91
#include "pars0pars.h"
92
#include "usr0sess.h"
93
#include "lock0lock.h"
94
#include "trx0purge.h"
95
#include "ibuf0ibuf.h"
96
#include "buf0flu.h"
97
#include "buf0lru.h"
98
#include "btr0sea.h"
99
#include "dict0load.h"
100
#include "dict0boot.h"
101
#include "srv0start.h"
102
#include "row0mysql.h"
103
#include "ha_prototypes.h"
104
#include "trx0i_s.h"
1819.5.54 by stewart at flamingspork
[patch 054/129] Merge patch for revision 1845 from InnoDB SVN:
105
#include "os0sync.h" /* for HAVE_ATOMIC_BUILTINS */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
106
107
/* This is set to TRUE if the MySQL user has set it in MySQL; currently
108
affects only FOREIGN KEY definition parsing */
109
UNIV_INTERN ibool	srv_lower_case_table_names	= FALSE;
110
111
/* The following counter is incremented whenever there is some user activity
112
in the server */
113
UNIV_INTERN ulint	srv_activity_count	= 0;
114
115
/* The following is the maximum allowed duration of a lock wait. */
116
UNIV_INTERN ulint	srv_fatal_semaphore_wait_threshold = 600;
117
118
/* How much data manipulation language (DML) statements need to be delayed,
119
in microseconds, in order to reduce the lagging of the purge thread. */
120
UNIV_INTERN ulint	srv_dml_needed_delay = 0;
121
122
UNIV_INTERN ibool	srv_lock_timeout_and_monitor_active = FALSE;
123
UNIV_INTERN ibool	srv_error_monitor_active = FALSE;
124
125
UNIV_INTERN const char*	srv_main_thread_op_info = "";
126
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
127
/** Prefix used by MySQL to indicate pre-5.1 table name encoding */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
128
UNIV_INTERN const char	srv_mysql50_table_name_prefix[9] = "#mysql50#";
129
130
/* Server parameters which are read from the initfile */
131
132
/* The following three are dir paths which are catenated before file
133
names, where the file name itself may also contain a path */
134
135
UNIV_INTERN char*	srv_data_home	= NULL;
136
#ifdef UNIV_LOG_ARCHIVE
137
UNIV_INTERN char*	srv_arch_dir	= NULL;
138
#endif /* UNIV_LOG_ARCHIVE */
139
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
140
/** store to its own file each table created by an user; data
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
141
dictionary tables are in the system tablespace 0 */
142
UNIV_INTERN my_bool	srv_file_per_table;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
143
/** The file format to use on new *.ibd files. */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
144
UNIV_INTERN ulint	srv_file_format = 0;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
145
/** Whether to check file format during startup.  A value of
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
146
DICT_TF_FORMAT_MAX + 1 means no checking ie. FALSE.  The default is to
147
set it to the highest format we support. */
148
UNIV_INTERN ulint	srv_check_file_format_at_startup = DICT_TF_FORMAT_MAX;
149
150
#if DICT_TF_FORMAT_51
151
# error "DICT_TF_FORMAT_51 must be 0!"
152
#endif
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
153
/** Place locks to records only i.e. do not use next-key locking except
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
154
on duplicate key checking and foreign key checking */
155
UNIV_INTERN ibool	srv_locks_unsafe_for_binlog = FALSE;
156
157
UNIV_INTERN ulint	srv_n_data_files = 0;
158
UNIV_INTERN char**	srv_data_file_names = NULL;
159
/* size in database pages */
160
UNIV_INTERN ulint*	srv_data_file_sizes = NULL;
161
162
/* if TRUE, then we auto-extend the last data file */
163
UNIV_INTERN ibool	srv_auto_extend_last_data_file	= FALSE;
164
/* if != 0, this tells the max size auto-extending may increase the
165
last data file size */
166
UNIV_INTERN ulint	srv_last_file_size_max	= 0;
167
/* If the last data file is auto-extended, we add this
168
many pages to it at a time */
937.3.4 by Stewart Smith
fix innodb_autoextend_increment for sparc
169
UNIV_INTERN unsigned int srv_auto_extend_increment = 8;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
170
UNIV_INTERN ulint*	srv_data_file_is_raw_partition = NULL;
171
172
/* If the following is TRUE we do not allow inserts etc. This protects
173
the user from forgetting the 'newraw' keyword to my.cnf */
174
175
UNIV_INTERN ibool	srv_created_new_raw	= FALSE;
176
177
UNIV_INTERN char**	srv_log_group_home_dirs = NULL;
178
179
UNIV_INTERN ulint	srv_n_log_groups	= ULINT_MAX;
180
UNIV_INTERN ulint	srv_n_log_files		= ULINT_MAX;
181
/* size in database pages */
182
UNIV_INTERN ulint	srv_log_file_size	= ULINT_MAX;
183
/* size in database pages */
184
UNIV_INTERN ulint	srv_log_buffer_size	= ULINT_MAX;
185
UNIV_INTERN ulong	srv_flush_log_at_trx_commit = 1;
186
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
187
/* Try to flush dirty pages so as to avoid IO bursts at
188
the checkpoints. */
1114.1.1 by Monty Taylor
Merged InnoDB Plugin 1.0.4
189
UNIV_INTERN bool	srv_adaptive_flushing	= TRUE;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
190
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
191
/* The sort order table of the MySQL latin1_swedish_ci character set
192
collation */
1114.1.1 by Monty Taylor
Merged InnoDB Plugin 1.0.4
193
#if defined(BUILD_DRIZZLE)
641.1.4 by Monty Taylor
Merged in InnoDB changes.
194
UNIV_INTERN const byte	srv_latin1_ordering[256]	/* The sort order table of the latin1
195
					character set. The following table is
196
					the MySQL order as of Feb 10th, 2002 */
197
= {
198
  0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07
199
, 0x08, 0x09, 0x0A, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F
200
, 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17
201
, 0x18, 0x19, 0x1A, 0x1B, 0x1C, 0x1D, 0x1E, 0x1F
202
, 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27
203
, 0x28, 0x29, 0x2A, 0x2B, 0x2C, 0x2D, 0x2E, 0x2F
204
, 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37
205
, 0x38, 0x39, 0x3A, 0x3B, 0x3C, 0x3D, 0x3E, 0x3F
206
, 0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47
207
, 0x48, 0x49, 0x4A, 0x4B, 0x4C, 0x4D, 0x4E, 0x4F
208
, 0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57
209
, 0x58, 0x59, 0x5A, 0x5B, 0x5C, 0x5D, 0x5E, 0x5F
210
, 0x60, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47
211
, 0x48, 0x49, 0x4A, 0x4B, 0x4C, 0x4D, 0x4E, 0x4F
212
, 0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57
213
, 0x58, 0x59, 0x5A, 0x7B, 0x7C, 0x7D, 0x7E, 0x7F
214
, 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87
215
, 0x88, 0x89, 0x8A, 0x8B, 0x8C, 0x8D, 0x8E, 0x8F
216
, 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97
217
, 0x98, 0x99, 0x9A, 0x9B, 0x9C, 0x9D, 0x9E, 0x9F
218
, 0xA0, 0xA1, 0xA2, 0xA3, 0xA4, 0xA5, 0xA6, 0xA7
219
, 0xA8, 0xA9, 0xAA, 0xAB, 0xAC, 0xAD, 0xAE, 0xAF
220
, 0xB0, 0xB1, 0xB2, 0xB3, 0xB4, 0xB5, 0xB6, 0xB7
221
, 0xB8, 0xB9, 0xBA, 0xBB, 0xBC, 0xBD, 0xBE, 0xBF
222
, 0x41, 0x41, 0x41, 0x41, 0x5C, 0x5B, 0x5C, 0x43
223
, 0x45, 0x45, 0x45, 0x45, 0x49, 0x49, 0x49, 0x49
224
, 0x44, 0x4E, 0x4F, 0x4F, 0x4F, 0x4F, 0x5D, 0xD7
225
, 0xD8, 0x55, 0x55, 0x55, 0x59, 0x59, 0xDE, 0xDF
226
, 0x41, 0x41, 0x41, 0x41, 0x5C, 0x5B, 0x5C, 0x43
227
, 0x45, 0x45, 0x45, 0x45, 0x49, 0x49, 0x49, 0x49
228
, 0x44, 0x4E, 0x4F, 0x4F, 0x4F, 0x4F, 0x5D, 0xF7
229
, 0xD8, 0x55, 0x55, 0x55, 0x59, 0x59, 0xDE, 0xFF
230
};
1114.1.1 by Monty Taylor
Merged InnoDB Plugin 1.0.4
231
#else
232
UNIV_INTERN const byte*        srv_latin1_ordering;
233
#endif /* BUILD_DRIZZLE */
641.1.4 by Monty Taylor
Merged in InnoDB changes.
234
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
235
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
236
/* use os/external memory allocator */
237
UNIV_INTERN my_bool	srv_use_sys_malloc	= TRUE;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
238
/* requested size in kilobytes */
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
239
UNIV_INTERN ulint	srv_buf_pool_size	= ULINT_MAX;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
240
/* previously requested size */
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
241
UNIV_INTERN ulint	srv_buf_pool_old_size;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
242
/* current size in kilobytes */
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
243
UNIV_INTERN ulint	srv_buf_pool_curr_size	= 0;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
244
/* size in bytes */
245
UNIV_INTERN ulint	srv_mem_pool_size	= ULINT_MAX;
246
UNIV_INTERN ulint	srv_lock_table_size	= ULINT_MAX;
247
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
248
/* This parameter is deprecated. Use srv_n_io_[read|write]_threads
249
instead. */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
250
UNIV_INTERN ulint	srv_n_file_io_threads	= ULINT_MAX;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
251
UNIV_INTERN ulint	srv_n_read_io_threads	= ULINT_MAX;
252
UNIV_INTERN ulint	srv_n_write_io_threads	= ULINT_MAX;
253
254
/* User settable value of the number of pages that must be present
255
in the buffer cache and accessed sequentially for InnoDB to trigger a
256
readahead request. */
257
UNIV_INTERN ulong	srv_read_ahead_threshold	= 56;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
258
259
#ifdef UNIV_LOG_ARCHIVE
260
UNIV_INTERN ibool		srv_log_archive_on	= FALSE;
261
UNIV_INTERN ibool		srv_archive_recovery	= 0;
262
UNIV_INTERN ib_uint64_t	srv_archive_recovery_limit_lsn;
263
#endif /* UNIV_LOG_ARCHIVE */
264
265
/* This parameter is used to throttle the number of insert buffers that are
266
merged in a batch. By increasing this parameter on a faster disk you can
267
possibly reduce the number of I/O operations performed to complete the
268
merge operation. The value of this parameter is used as is by the
269
background loop when the system is idle (low load), on a busy system
270
the parameter is scaled down by a factor of 4, this is to avoid putting
271
a heavier load on the I/O sub system. */
272
273
UNIV_INTERN ulong	srv_insert_buffer_batch_size = 20;
274
275
UNIV_INTERN char*	srv_file_flush_method_str = NULL;
276
UNIV_INTERN ulint	srv_unix_file_flush_method = SRV_UNIX_FSYNC;
277
UNIV_INTERN ulint	srv_win_file_flush_method = SRV_WIN_IO_UNBUFFERED;
278
279
UNIV_INTERN ulint	srv_max_n_open_files	  = 300;
280
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
281
/* Number of IO operations per second the server can do */
282
UNIV_INTERN ulong	srv_io_capacity         = 200;
283
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
284
/* The InnoDB main thread tries to keep the ratio of modified pages
285
in the buffer pool to all database pages in the buffer pool smaller than
286
the following number. But it is not guaranteed that the value stays below
287
that during a time of heavy update/insert activity. */
288
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
289
UNIV_INTERN ulong	srv_max_buf_pool_modified_pct	= 75;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
290
291
/* variable counts amount of data read in total (in bytes) */
292
UNIV_INTERN ulint srv_data_read = 0;
293
294
/* here we count the amount of data written in total (in bytes) */
295
UNIV_INTERN ulint srv_data_written = 0;
296
297
/* the number of the log write requests done */
298
UNIV_INTERN ulint srv_log_write_requests = 0;
299
300
/* the number of physical writes to the log performed */
301
UNIV_INTERN ulint srv_log_writes = 0;
302
303
/* amount of data written to the log files in bytes */
304
UNIV_INTERN ulint srv_os_log_written = 0;
305
306
/* amount of writes being done to the log files */
307
UNIV_INTERN ulint srv_os_log_pending_writes = 0;
308
309
/* we increase this counter, when there we don't have enough space in the
310
log buffer and have to flush it */
311
UNIV_INTERN ulint srv_log_waits = 0;
312
313
/* this variable counts the amount of times, when the doublewrite buffer
314
was flushed */
315
UNIV_INTERN ulint srv_dblwr_writes = 0;
316
317
/* here we store the number of pages that have been flushed to the
318
doublewrite buffer */
319
UNIV_INTERN ulint srv_dblwr_pages_written = 0;
320
321
/* in this variable we store the number of write requests issued */
322
UNIV_INTERN ulint srv_buf_pool_write_requests = 0;
323
324
/* here we store the number of times when we had to wait for a free page
325
in the buffer pool. It happens when the buffer pool is full and we need
326
to make a flush, in order to be able to read or create a page. */
327
UNIV_INTERN ulint srv_buf_pool_wait_free = 0;
328
329
/* variable to count the number of pages that were written from buffer
330
pool to the disk */
331
UNIV_INTERN ulint srv_buf_pool_flushed = 0;
332
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
333
/** Number of buffer pool reads that led to the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
334
reading of a disk page */
335
UNIV_INTERN ulint srv_buf_pool_reads = 0;
336
337
/* structure to pass status variables to MySQL */
338
UNIV_INTERN export_struc export_vars;
339
340
/* If the following is != 0 we do not allow inserts etc. This protects
341
the user from forgetting the innodb_force_recovery keyword to my.cnf */
342
343
UNIV_INTERN ulint	srv_force_recovery	= 0;
344
/*-----------------------*/
345
/* We are prepared for a situation that we have this many threads waiting for
346
a semaphore inside InnoDB. innobase_start_or_create_for_mysql() sets the
347
value. */
348
349
UNIV_INTERN ulint	srv_max_n_threads	= 0;
350
351
/* The following controls how many threads we let inside InnoDB concurrently:
352
threads waiting for locks are not counted into the number because otherwise
353
we could get a deadlock. MySQL creates a thread for each user session, and
354
semaphore contention and convoy problems can occur withput this restriction.
355
Value 10 should be good if there are less than 4 processors + 4 disks in the
356
computer. Bigger computers need bigger values. Value 0 will disable the
357
concurrency check. */
358
359
UNIV_INTERN ulong	srv_thread_concurrency	= 0;
360
361
/* this mutex protects srv_conc data structures */
362
UNIV_INTERN os_fast_mutex_t	srv_conc_mutex;
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
363
/* number of transactions that have declared_to_be_inside_innodb set.
364
It used to be a non-error for this value to drop below zero temporarily.
365
This is no longer true. We'll, however, keep the lint datatype to add
366
assertions to catch any corner cases that we may have missed. */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
367
UNIV_INTERN lint	srv_conc_n_threads	= 0;
368
/* number of OS threads waiting in the FIFO for a permission to enter
369
InnoDB */
370
UNIV_INTERN ulint	srv_conc_n_waiting_threads = 0;
371
372
typedef struct srv_conc_slot_struct	srv_conc_slot_t;
373
struct srv_conc_slot_struct{
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
374
	os_event_t			event;		/*!< event to wait */
375
	ibool				reserved;	/*!< TRUE if slot
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
376
							reserved */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
377
	ibool				wait_ended;	/*!< TRUE when another
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
378
							thread has already set
379
							the event and the
380
							thread in this slot is
381
							free to proceed; but
382
							reserved may still be
383
							TRUE at that point */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
384
	UT_LIST_NODE_T(srv_conc_slot_t)	srv_conc_queue;	/*!< queue node */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
385
};
386
387
/* queue of threads waiting to get in */
388
UNIV_INTERN UT_LIST_BASE_NODE_T(srv_conc_slot_t)	srv_conc_queue;
389
/* array of wait slots */
390
UNIV_INTERN srv_conc_slot_t* srv_conc_slots;
391
392
/* Number of times a thread is allowed to enter InnoDB within the same
393
SQL query after it has once got the ticket at srv_conc_enter_innodb */
394
#define SRV_FREE_TICKETS_TO_ENTER srv_n_free_tickets_to_enter
395
#define SRV_THREAD_SLEEP_DELAY srv_thread_sleep_delay
396
/*-----------------------*/
397
/* If the following is set to 1 then we do not run purge and insert buffer
398
merge to completion before shutdown. If it is set to 2, do not even flush the
399
buffer pool to data files at the shutdown: we effectively 'crash'
400
InnoDB (but lose no committed transactions). */
401
UNIV_INTERN ulint	srv_fast_shutdown	= 0;
402
403
/* Generate a innodb_status.<pid> file */
404
UNIV_INTERN ibool	srv_innodb_status	= FALSE;
405
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
406
/* When estimating number of different key values in an index, sample
407
this many index pages */
641.3.9 by Monty Taylor
More removal of my_malloc.
408
UNIV_INTERN ib_uint64_t	srv_stats_sample_pages = 8;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
409
410
UNIV_INTERN ibool	srv_use_doublewrite_buf	= TRUE;
411
UNIV_INTERN ibool	srv_use_checksums = TRUE;
412
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
413
UNIV_INTERN ulong	srv_replication_delay		= 0;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
414
415
/*-------------------------------------------*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
416
UNIV_INTERN ulong	srv_n_spin_wait_rounds	= 30;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
417
UNIV_INTERN ulong	srv_n_free_tickets_to_enter = 500;
418
UNIV_INTERN ulong	srv_thread_sleep_delay = 10000;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
419
UNIV_INTERN ulong	srv_spin_wait_delay	= 6;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
420
UNIV_INTERN ibool	srv_priority_boost	= TRUE;
421
422
#ifdef UNIV_DEBUG
423
UNIV_INTERN ibool	srv_print_thread_releases	= FALSE;
424
UNIV_INTERN ibool	srv_print_lock_waits		= FALSE;
425
UNIV_INTERN ibool	srv_print_buf_io		= FALSE;
426
UNIV_INTERN ibool	srv_print_log_io		= FALSE;
427
UNIV_INTERN ibool	srv_print_latch_waits		= FALSE;
428
#endif /* UNIV_DEBUG */
429
430
UNIV_INTERN ulint		srv_n_rows_inserted		= 0;
431
UNIV_INTERN ulint		srv_n_rows_updated		= 0;
432
UNIV_INTERN ulint		srv_n_rows_deleted		= 0;
433
UNIV_INTERN ulint		srv_n_rows_read			= 0;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
434
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
435
static ulint	srv_n_rows_inserted_old		= 0;
436
static ulint	srv_n_rows_updated_old		= 0;
437
static ulint	srv_n_rows_deleted_old		= 0;
438
static ulint	srv_n_rows_read_old		= 0;
439
440
UNIV_INTERN ulint		srv_n_lock_wait_count		= 0;
441
UNIV_INTERN ulint		srv_n_lock_wait_current_count	= 0;
442
UNIV_INTERN ib_int64_t	srv_n_lock_wait_time		= 0;
443
UNIV_INTERN ulint		srv_n_lock_max_wait_time	= 0;
444
445
446
/*
447
  Set the following to 0 if you want InnoDB to write messages on
448
  stderr on startup/shutdown
449
*/
450
UNIV_INTERN ibool	srv_print_verbose_log		= TRUE;
451
UNIV_INTERN ibool	srv_print_innodb_monitor	= FALSE;
452
UNIV_INTERN ibool	srv_print_innodb_lock_monitor	= FALSE;
453
UNIV_INTERN ibool	srv_print_innodb_tablespace_monitor = FALSE;
454
UNIV_INTERN ibool	srv_print_innodb_table_monitor = FALSE;
455
456
/* Array of English strings describing the current state of an
457
i/o handler thread */
458
459
UNIV_INTERN const char* srv_io_thread_op_info[SRV_MAX_N_IO_THREADS];
460
UNIV_INTERN const char* srv_io_thread_function[SRV_MAX_N_IO_THREADS];
461
462
UNIV_INTERN time_t	srv_last_monitor_time;
463
464
UNIV_INTERN mutex_t	srv_innodb_monitor_mutex;
465
466
/* Mutex for locking srv_monitor_file */
467
UNIV_INTERN mutex_t	srv_monitor_file_mutex;
468
/* Temporary file for innodb monitor output */
469
UNIV_INTERN FILE*	srv_monitor_file;
470
/* Mutex for locking srv_dict_tmpfile.
471
This mutex has a very high rank; threads reserving it should not
472
be holding any InnoDB latches. */
473
UNIV_INTERN mutex_t	srv_dict_tmpfile_mutex;
474
/* Temporary file for output from the data dictionary */
475
UNIV_INTERN FILE*	srv_dict_tmpfile;
476
/* Mutex for locking srv_misc_tmpfile.
477
This mutex has a very low rank; threads reserving it should not
478
acquire any further latches or sleep before releasing this one. */
479
UNIV_INTERN mutex_t	srv_misc_tmpfile_mutex;
480
/* Temporary file for miscellanous diagnostic output */
481
UNIV_INTERN FILE*	srv_misc_tmpfile;
482
483
UNIV_INTERN ulint	srv_main_thread_process_no	= 0;
484
UNIV_INTERN ulint	srv_main_thread_id		= 0;
485
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
486
/* The following count work done by srv_master_thread. */
487
488
/* Iterations by the 'once per second' loop. */
489
static ulint   srv_main_1_second_loops		= 0;
490
/* Calls to sleep by the 'once per second' loop. */
491
static ulint   srv_main_sleeps			= 0;
492
/* Iterations by the 'once per 10 seconds' loop. */
493
static ulint   srv_main_10_second_loops		= 0;
494
/* Iterations of the loop bounded by the 'background_loop' label. */
495
static ulint   srv_main_background_loops	= 0;
496
/* Iterations of the loop bounded by the 'flush_loop' label. */
497
static ulint   srv_main_flush_loops		= 0;
498
/* Log writes involving flush. */
499
static ulint   srv_log_writes_and_flush		= 0;
500
501
/* This is only ever touched by the master thread. It records the
502
time when the last flush of log file has happened. The master
503
thread ensures that we flush the log files at least once per
504
second. */
505
static time_t	srv_last_log_flush_time;
506
507
/* The master thread performs various tasks based on the current
508
state of IO activity and the level of IO utilization is past
509
intervals. Following macros define thresholds for these conditions. */
510
#define SRV_PEND_IO_THRESHOLD	(PCT_IO(3))
511
#define SRV_RECENT_IO_ACTIVITY	(PCT_IO(5))
512
#define SRV_PAST_IO_ACTIVITY	(PCT_IO(200))
513
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
514
/*
515
	IMPLEMENTATION OF THE SERVER MAIN PROGRAM
516
	=========================================
517
518
There is the following analogue between this database
519
server and an operating system kernel:
520
521
DB concept			equivalent OS concept
522
----------			---------------------
523
transaction		--	process;
524
525
query thread		--	thread;
526
527
lock			--	semaphore;
528
529
transaction set to
530
the rollback state	--	kill signal delivered to a process;
531
532
kernel			--	kernel;
533
534
query thread execution:
535
(a) without kernel mutex
536
reserved		--	process executing in user mode;
537
(b) with kernel mutex reserved
538
			--	process executing in kernel mode;
539
540
The server is controlled by a master thread which runs at
541
a priority higher than normal, that is, higher than user threads.
542
It sleeps most of the time, and wakes up, say, every 300 milliseconds,
543
to check whether there is anything happening in the server which
544
requires intervention of the master thread. Such situations may be,
545
for example, when flushing of dirty blocks is needed in the buffer
546
pool or old version of database rows have to be cleaned away.
547
548
The threads which we call user threads serve the queries of
549
the clients and input from the console of the server.
550
They run at normal priority. The server may have several
551
communications endpoints. A dedicated set of user threads waits
552
at each of these endpoints ready to receive a client request.
553
Each request is taken by a single user thread, which then starts
554
processing and, when the result is ready, sends it to the client
555
and returns to wait at the same endpoint the thread started from.
556
557
So, we do not have dedicated communication threads listening at
558
the endpoints and dealing the jobs to dedicated worker threads.
559
Our architecture saves one thread swithch per request, compared
560
to the solution with dedicated communication threads
561
which amounts to 15 microseconds on 100 MHz Pentium
562
running NT. If the client
563
is communicating over a network, this saving is negligible, but
564
if the client resides in the same machine, maybe in an SMP machine
565
on a different processor from the server thread, the saving
566
can be important as the threads can communicate over shared
567
memory with an overhead of a few microseconds.
568
569
We may later implement a dedicated communication thread solution
570
for those endpoints which communicate over a network.
571
572
Our solution with user threads has two problems: for each endpoint
573
there has to be a number of listening threads. If there are many
574
communication endpoints, it may be difficult to set the right number
575
of concurrent threads in the system, as many of the threads
576
may always be waiting at less busy endpoints. Another problem
577
is queuing of the messages, as the server internally does not
578
offer any queue for jobs.
579
580
Another group of user threads is intended for splitting the
581
queries and processing them in parallel. Let us call these
582
parallel communication threads. These threads are waiting for
583
parallelized tasks, suspended on event semaphores.
584
585
A single user thread waits for input from the console,
586
like a command to shut the database.
587
588
Utility threads are a different group of threads which takes
589
care of the buffer pool flushing and other, mainly background
590
operations, in the server.
591
Some of these utility threads always run at a lower than normal
592
priority, so that they are always in background. Some of them
593
may dynamically boost their priority by the pri_adjust function,
594
even to higher than normal priority, if their task becomes urgent.
595
The running of utilities is controlled by high- and low-water marks
596
of urgency. The urgency may be measured by the number of dirty blocks
597
in the buffer pool, in the case of the flush thread, for example.
598
When the high-water mark is exceeded, an utility starts running, until
599
the urgency drops under the low-water mark. Then the utility thread
600
suspend itself to wait for an event. The master thread is
601
responsible of signaling this event when the utility thread is
602
again needed.
603
604
For each individual type of utility, some threads always remain
605
at lower than normal priority. This is because pri_adjust is implemented
606
so that the threads at normal or higher priority control their
607
share of running time by calling sleep. Thus, if the load of the
608
system sudenly drops, these threads cannot necessarily utilize
609
the system fully. The background priority threads make up for this,
610
starting to run when the load drops.
611
612
When there is no activity in the system, also the master thread
613
suspends itself to wait for an event making
614
the server totally silent. The responsibility to signal this
615
event is on the user thread which again receives a message
616
from a client.
617
618
There is still one complication in our server design. If a
619
background utility thread obtains a resource (e.g., mutex) needed by a user
620
thread, and there is also some other user activity in the system,
621
the user thread may have to wait indefinitely long for the
622
resource, as the OS does not schedule a background thread if
623
there is some other runnable user thread. This problem is called
624
priority inversion in real-time programming.
625
626
One solution to the priority inversion problem would be to
627
keep record of which thread owns which resource and
628
in the above case boost the priority of the background thread
629
so that it will be scheduled and it can release the resource.
630
This solution is called priority inheritance in real-time programming.
631
A drawback of this solution is that the overhead of acquiring a mutex
632
increases slightly, maybe 0.2 microseconds on a 100 MHz Pentium, because
633
the thread has to call os_thread_get_curr_id.
634
This may be compared to 0.5 microsecond overhead for a mutex lock-unlock
635
pair. Note that the thread
636
cannot store the information in the resource, say mutex, itself,
637
because competing threads could wipe out the information if it is
638
stored before acquiring the mutex, and if it stored afterwards,
639
the information is outdated for the time of one machine instruction,
640
at least. (To be precise, the information could be stored to
641
lock_word in mutex if the machine supports atomic swap.)
642
643
The above solution with priority inheritance may become actual in the
644
future, but at the moment we plan to implement a more coarse solution,
645
which could be called a global priority inheritance. If a thread
646
has to wait for a long time, say 300 milliseconds, for a resource,
647
we just guess that it may be waiting for a resource owned by a background
648
thread, and boost the the priority of all runnable background threads
649
to the normal level. The background threads then themselves adjust
650
their fixed priority back to background after releasing all resources
651
they had (or, at some fixed points in their program code).
652
653
What is the performance of the global priority inheritance solution?
654
We may weigh the length of the wait time 300 milliseconds, during
655
which the system processes some other thread
656
to the cost of boosting the priority of each runnable background
657
thread, rescheduling it, and lowering the priority again.
658
On 100 MHz Pentium + NT this overhead may be of the order 100
659
microseconds per thread. So, if the number of runnable background
660
threads is not very big, say < 100, the cost is tolerable.
661
Utility threads probably will access resources used by
662
user threads not very often, so collisions of user threads
663
to preempted utility threads should not happen very often.
664
665
The thread table contains
666
information of the current status of each thread existing in the system,
667
and also the event semaphores used in suspending the master thread
668
and utility and parallel communication threads when they have nothing to do.
669
The thread table can be seen as an analogue to the process table
670
in a traditional Unix implementation.
671
672
The thread table is also used in the global priority inheritance
673
scheme. This brings in one additional complication: threads accessing
674
the thread table must have at least normal fixed priority,
675
because the priority inheritance solution does not work if a background
676
thread is preempted while possessing the mutex protecting the thread table.
677
So, if a thread accesses the thread table, its priority has to be
678
boosted at least to normal. This priority requirement can be seen similar to
679
the privileged mode used when processing the kernel calls in traditional
680
Unix.*/
681
682
/* Thread slot in the thread table */
683
struct srv_slot_struct{
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
684
	os_thread_id_t	id;		/*!< thread id */
685
	os_thread_t	handle;		/*!< thread handle */
686
	unsigned	type:3;		/*!< thread type: user, utility etc. */
687
	unsigned	in_use:1;	/*!< TRUE if this slot is in use */
688
	unsigned	suspended:1;	/*!< TRUE if the thread is waiting
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
689
					for the event of this slot */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
690
	ib_time_t	suspend_time;	/*!< time when the thread was
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
691
					suspended */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
692
	os_event_t	event;		/*!< event used in suspending the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
693
					thread when it has nothing to do */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
694
	que_thr_t*	thr;		/*!< suspended query thread (only
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
695
					used for MySQL threads) */
696
};
697
698
/* Table for MySQL threads where they will be suspended to wait for locks */
699
UNIV_INTERN srv_slot_t*	srv_mysql_table = NULL;
700
701
UNIV_INTERN os_event_t	srv_lock_timeout_thread_event;
702
703
UNIV_INTERN srv_sys_t*	srv_sys	= NULL;
704
705
/* padding to prevent other memory update hotspots from residing on
706
the same memory cache line */
707
UNIV_INTERN byte	srv_pad1[64];
708
/* mutex protecting the server, trx structs, query threads, and lock table */
709
UNIV_INTERN mutex_t*	kernel_mutex_temp;
710
/* padding to prevent other memory update hotspots from residing on
711
the same memory cache line */
712
UNIV_INTERN byte	srv_pad2[64];
713
714
#if 0
715
/* The following three values measure the urgency of the jobs of
716
buffer, version, and insert threads. They may vary from 0 - 1000.
717
The server mutex protects all these variables. The low-water values
718
tell that the server can acquiesce the utility when the value
719
drops below this low-water mark. */
720
721
static ulint	srv_meter[SRV_MASTER + 1];
722
static ulint	srv_meter_low_water[SRV_MASTER + 1];
723
static ulint	srv_meter_high_water[SRV_MASTER + 1];
724
static ulint	srv_meter_high_water2[SRV_MASTER + 1];
725
static ulint	srv_meter_foreground[SRV_MASTER + 1];
726
#endif
727
728
/* The following values give info about the activity going on in
729
the database. They are protected by the server mutex. The arrays
730
are indexed by the type of the thread. */
731
732
UNIV_INTERN ulint	srv_n_threads_active[SRV_MASTER + 1];
733
UNIV_INTERN ulint	srv_n_threads[SRV_MASTER + 1];
734
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
735
/***********************************************************************
736
Prints counters for work done by srv_master_thread. */
737
static
738
void
739
srv_print_master_thread_info(
740
/*=========================*/
741
	FILE  *file)    /* in: output stream */
742
{
743
	fprintf(file, "srv_master_thread loops: %lu 1_second, %lu sleeps, "
744
		"%lu 10_second, %lu background, %lu flush\n",
745
		srv_main_1_second_loops, srv_main_sleeps,
746
		srv_main_10_second_loops, srv_main_background_loops,
747
		srv_main_flush_loops);
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
748
	fprintf(file, "srv_master_thread log flush and writes: %lu\n",
749
		      srv_log_writes_and_flush);
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
750
}
751
752
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
753
Sets the info describing an i/o thread current state. */
754
UNIV_INTERN
755
void
756
srv_set_io_thread_op_info(
757
/*======================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
758
	ulint		i,	/*!< in: the 'segment' of the i/o thread */
759
	const char*	str)	/*!< in: constant char string describing the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
760
				state */
761
{
762
	ut_a(i < SRV_MAX_N_IO_THREADS);
763
764
	srv_io_thread_op_info[i] = str;
765
}
766
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
767
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
768
Accessor function to get pointer to n'th slot in the server thread
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
769
table.
770
@return	pointer to the slot */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
771
static
772
srv_slot_t*
773
srv_table_get_nth_slot(
774
/*===================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
775
	ulint	index)		/*!< in: index of the slot */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
776
{
777
	ut_a(index < OS_THREAD_MAX_N);
778
779
	return(srv_sys->threads + index);
780
}
781
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
782
/*********************************************************************//**
783
Gets the number of threads in the system.
784
@return	sum of srv_n_threads[] */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
785
UNIV_INTERN
786
ulint
787
srv_get_n_threads(void)
788
/*===================*/
789
{
790
	ulint	i;
791
	ulint	n_threads	= 0;
792
793
	mutex_enter(&kernel_mutex);
794
795
	for (i = SRV_COM; i < SRV_MASTER + 1; i++) {
796
797
		n_threads += srv_n_threads[i];
798
	}
799
800
	mutex_exit(&kernel_mutex);
801
802
	return(n_threads);
803
}
804
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
805
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
806
Reserves a slot in the thread table for the current thread. Also creates the
807
thread local storage struct for the current thread. NOTE! The server mutex
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
808
has to be reserved by the caller!
809
@return	reserved slot index */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
810
static
811
ulint
812
srv_table_reserve_slot(
813
/*===================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
814
	enum srv_thread_type	type)	/*!< in: type of the thread */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
815
{
816
	srv_slot_t*	slot;
817
	ulint		i;
818
819
	ut_a(type > 0);
820
	ut_a(type <= SRV_MASTER);
821
822
	i = 0;
823
	slot = srv_table_get_nth_slot(i);
824
825
	while (slot->in_use) {
826
		i++;
827
		slot = srv_table_get_nth_slot(i);
828
	}
829
830
	ut_a(slot->in_use == FALSE);
831
832
	slot->in_use = TRUE;
833
	slot->suspended = FALSE;
834
	slot->type = type;
835
	slot->id = os_thread_get_curr_id();
836
	slot->handle = os_thread_get_curr();
837
838
	thr_local_create();
839
840
	thr_local_set_slot_no(os_thread_get_curr_id(), i);
841
842
	return(i);
843
}
844
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
845
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
846
Suspends the calling thread to wait for the event in its thread slot.
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
847
NOTE! The server mutex has to be reserved by the caller!
848
@return	event for the calling thread to wait */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
849
static
850
os_event_t
851
srv_suspend_thread(void)
852
/*====================*/
853
{
854
	srv_slot_t*		slot;
855
	os_event_t		event;
856
	ulint			slot_no;
857
	enum srv_thread_type	type;
858
859
	ut_ad(mutex_own(&kernel_mutex));
860
861
	slot_no = thr_local_get_slot_no(os_thread_get_curr_id());
862
863
	if (srv_print_thread_releases) {
864
		fprintf(stderr,
865
			"Suspending thread %lu to slot %lu\n",
866
			(ulong) os_thread_get_curr_id(), (ulong) slot_no);
867
	}
868
869
	slot = srv_table_get_nth_slot(slot_no);
870
871
	type = slot->type;
872
873
	ut_ad(type >= SRV_WORKER);
874
	ut_ad(type <= SRV_MASTER);
875
876
	event = slot->event;
877
878
	slot->suspended = TRUE;
879
880
	ut_ad(srv_n_threads_active[type] > 0);
881
882
	srv_n_threads_active[type]--;
883
884
	os_event_reset(event);
885
886
	return(event);
887
}
888
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
889
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
890
Releases threads of the type given from suspension in the thread table.
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
891
NOTE! The server mutex has to be reserved by the caller!
892
@return number of threads released: this may be less than n if not
893
enough threads were suspended at the moment */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
894
UNIV_INTERN
895
ulint
896
srv_release_threads(
897
/*================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
898
	enum srv_thread_type	type,	/*!< in: thread type */
899
	ulint			n)	/*!< in: number of threads to release */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
900
{
901
	srv_slot_t*	slot;
902
	ulint		i;
903
	ulint		count	= 0;
904
905
	ut_ad(type >= SRV_WORKER);
906
	ut_ad(type <= SRV_MASTER);
907
	ut_ad(n > 0);
908
	ut_ad(mutex_own(&kernel_mutex));
909
910
	for (i = 0; i < OS_THREAD_MAX_N; i++) {
911
912
		slot = srv_table_get_nth_slot(i);
913
914
		if (slot->in_use && slot->type == type && slot->suspended) {
915
916
			slot->suspended = FALSE;
917
918
			srv_n_threads_active[type]++;
919
920
			os_event_set(slot->event);
921
922
			if (srv_print_thread_releases) {
923
				fprintf(stderr,
924
					"Releasing thread %lu type %lu"
925
					" from slot %lu\n",
926
					(ulong) slot->id, (ulong) type,
927
					(ulong) i);
928
			}
929
930
			count++;
931
932
			if (count == n) {
933
				break;
934
			}
935
		}
936
	}
937
938
	return(count);
939
}
940
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
941
/*********************************************************************//**
942
Returns the calling thread type.
943
@return	SRV_COM, ... */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
944
UNIV_INTERN
945
enum srv_thread_type
946
srv_get_thread_type(void)
947
/*=====================*/
948
{
949
	ulint			slot_no;
950
	srv_slot_t*		slot;
951
	enum srv_thread_type	type;
952
953
	mutex_enter(&kernel_mutex);
954
955
	slot_no = thr_local_get_slot_no(os_thread_get_curr_id());
956
957
	slot = srv_table_get_nth_slot(slot_no);
958
959
	type = slot->type;
960
961
	ut_ad(type >= SRV_WORKER);
962
	ut_ad(type <= SRV_MASTER);
963
964
	mutex_exit(&kernel_mutex);
965
966
	return(type);
967
}
968
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
969
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
970
Initializes the server. */
971
UNIV_INTERN
972
void
973
srv_init(void)
974
/*==========*/
975
{
976
	srv_conc_slot_t*	conc_slot;
977
	srv_slot_t*		slot;
978
	ulint			i;
979
980
	srv_sys = mem_alloc(sizeof(srv_sys_t));
981
982
	kernel_mutex_temp = mem_alloc(sizeof(mutex_t));
983
	mutex_create(&kernel_mutex, SYNC_KERNEL);
984
985
	mutex_create(&srv_innodb_monitor_mutex, SYNC_NO_ORDER_CHECK);
986
987
	srv_sys->threads = mem_alloc(OS_THREAD_MAX_N * sizeof(srv_slot_t));
988
989
	for (i = 0; i < OS_THREAD_MAX_N; i++) {
990
		slot = srv_table_get_nth_slot(i);
991
		slot->in_use = FALSE;
992
		slot->type=0;	/* Avoid purify errors */
993
		slot->event = os_event_create(NULL);
994
		ut_a(slot->event);
995
	}
996
997
	srv_mysql_table = mem_alloc(OS_THREAD_MAX_N * sizeof(srv_slot_t));
998
999
	for (i = 0; i < OS_THREAD_MAX_N; i++) {
1000
		slot = srv_mysql_table + i;
1001
		slot->in_use = FALSE;
1002
		slot->type = 0;
1003
		slot->event = os_event_create(NULL);
1004
		ut_a(slot->event);
1005
	}
1006
1007
	srv_lock_timeout_thread_event = os_event_create(NULL);
1008
1009
	for (i = 0; i < SRV_MASTER + 1; i++) {
1010
		srv_n_threads_active[i] = 0;
1011
		srv_n_threads[i] = 0;
1012
#if 0
1013
		srv_meter[i] = 30;
1014
		srv_meter_low_water[i] = 50;
1015
		srv_meter_high_water[i] = 100;
1016
		srv_meter_high_water2[i] = 200;
1017
		srv_meter_foreground[i] = 250;
1018
#endif
1019
	}
1020
1021
	UT_LIST_INIT(srv_sys->tasks);
1022
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1023
	/* Create dummy indexes for infimum and supremum records */
1024
1025
	dict_ind_init();
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1026
1027
	/* Init the server concurrency restriction data structures */
1028
1029
	os_fast_mutex_init(&srv_conc_mutex);
1030
1031
	UT_LIST_INIT(srv_conc_queue);
1032
1033
	srv_conc_slots = mem_alloc(OS_THREAD_MAX_N * sizeof(srv_conc_slot_t));
1034
1035
	for (i = 0; i < OS_THREAD_MAX_N; i++) {
1036
		conc_slot = srv_conc_slots + i;
1037
		conc_slot->reserved = FALSE;
1038
		conc_slot->event = os_event_create(NULL);
1039
		ut_a(conc_slot->event);
1040
	}
1041
1042
	/* Initialize some INFORMATION SCHEMA internal structures */
1043
	trx_i_s_cache_init(trx_i_s_cache);
1044
}
1045
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1046
/*********************************************************************//**
1819.5.106 by stewart at flamingspork
[patch 106/129] Merge patch for revision 1915 from InnoDB SVN:
1047
Frees the data structures created in srv_init(). */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1048
UNIV_INTERN
1049
void
1050
srv_free(void)
1051
/*==========*/
1052
{
1053
	os_fast_mutex_free(&srv_conc_mutex);
1819.5.106 by stewart at flamingspork
[patch 106/129] Merge patch for revision 1915 from InnoDB SVN:
1054
	mem_free(srv_conc_slots);
1055
	srv_conc_slots = NULL;
1056
1057
	mem_free(srv_sys->threads);
1058
	mem_free(srv_sys);
1059
	srv_sys = NULL;
1060
1061
	mem_free(kernel_mutex_temp);
1062
	kernel_mutex_temp = NULL;
1063
	mem_free(srv_mysql_table);
1064
	srv_mysql_table = NULL;
1065
1066
	trx_i_s_cache_free(trx_i_s_cache);
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1067
}
1068
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1069
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1070
Initializes the synchronization primitives, memory system, and the thread
1071
local storage. */
1072
UNIV_INTERN
1073
void
1074
srv_general_init(void)
1075
/*==================*/
1076
{
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1077
	ut_mem_init();
1819.5.106 by stewart at flamingspork
[patch 106/129] Merge patch for revision 1915 from InnoDB SVN:
1078
	/* Reset the system variables in the recovery module. */
1079
	recv_sys_var_init();
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1080
	os_sync_init();
1081
	sync_init();
1082
	mem_init(srv_mem_pool_size);
1083
	thr_local_init();
1084
}
1085
1086
/*======================= InnoDB Server FIFO queue =======================*/
1087
1088
/* Maximum allowable purge history length.  <=0 means 'infinite'. */
1089
UNIV_INTERN ulong	srv_max_purge_lag		= 0;
1090
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1091
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1092
Puts an OS thread to wait if there are too many concurrent threads
1093
(>= srv_thread_concurrency) inside InnoDB. The threads wait in a FIFO queue. */
1094
UNIV_INTERN
1095
void
1096
srv_conc_enter_innodb(
1097
/*==================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1098
	trx_t*	trx)	/*!< in: transaction object associated with the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1099
			thread */
1100
{
1101
	ibool			has_slept = FALSE;
1102
	srv_conc_slot_t*	slot	  = NULL;
1103
	ulint			i;
1104
1105
	if (trx->mysql_thd != NULL
1106
	    && thd_is_replication_slave_thread(trx->mysql_thd)) {
1107
1108
		UT_WAIT_FOR(srv_conc_n_threads
1109
			    < (lint)srv_thread_concurrency,
1110
			    srv_replication_delay * 1000);
1111
1112
		return;
1113
	}
1114
1115
	/* If trx has 'free tickets' to enter the engine left, then use one
1116
	such ticket */
1117
1118
	if (trx->n_tickets_to_enter_innodb > 0) {
1119
		trx->n_tickets_to_enter_innodb--;
1120
1121
		return;
1122
	}
1123
1124
	os_fast_mutex_lock(&srv_conc_mutex);
1125
retry:
1126
	if (trx->declared_to_be_inside_innodb) {
1127
		ut_print_timestamp(stderr);
1128
		fputs("  InnoDB: Error: trying to declare trx"
1129
		      " to enter InnoDB, but\n"
1130
		      "InnoDB: it already is declared.\n", stderr);
1131
		trx_print(stderr, trx, 0);
1132
		putc('\n', stderr);
1133
		os_fast_mutex_unlock(&srv_conc_mutex);
1134
1135
		return;
1136
	}
1137
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1138
	ut_ad(srv_conc_n_threads >= 0);
1139
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1140
	if (srv_conc_n_threads < (lint)srv_thread_concurrency) {
1141
1142
		srv_conc_n_threads++;
1143
		trx->declared_to_be_inside_innodb = TRUE;
1144
		trx->n_tickets_to_enter_innodb = SRV_FREE_TICKETS_TO_ENTER;
1145
1146
		os_fast_mutex_unlock(&srv_conc_mutex);
1147
1148
		return;
1149
	}
1150
1151
	/* If the transaction is not holding resources, let it sleep
1152
	for SRV_THREAD_SLEEP_DELAY microseconds, and try again then */
1153
1154
	if (!has_slept && !trx->has_search_latch
1155
	    && NULL == UT_LIST_GET_FIRST(trx->trx_locks)) {
1156
1157
		has_slept = TRUE; /* We let it sleep only once to avoid
1158
				  starvation */
1159
1160
		srv_conc_n_waiting_threads++;
1161
1162
		os_fast_mutex_unlock(&srv_conc_mutex);
1163
1164
		trx->op_info = "sleeping before joining InnoDB queue";
1165
1166
		/* Peter Zaitsev suggested that we take the sleep away
1167
		altogether. But the sleep may be good in pathological
1168
		situations of lots of thread switches. Simply put some
1169
		threads aside for a while to reduce the number of thread
1170
		switches. */
1171
		if (SRV_THREAD_SLEEP_DELAY > 0) {
1172
			os_thread_sleep(SRV_THREAD_SLEEP_DELAY);
1173
		}
1174
1175
		trx->op_info = "";
1176
1177
		os_fast_mutex_lock(&srv_conc_mutex);
1178
1179
		srv_conc_n_waiting_threads--;
1180
1181
		goto retry;
1182
	}
1183
1184
	/* Too many threads inside: put the current thread to a queue */
1185
1186
	for (i = 0; i < OS_THREAD_MAX_N; i++) {
1187
		slot = srv_conc_slots + i;
1188
1189
		if (!slot->reserved) {
1190
1191
			break;
1192
		}
1193
	}
1194
1195
	if (i == OS_THREAD_MAX_N) {
1196
		/* Could not find a free wait slot, we must let the
1197
		thread enter */
1198
1199
		srv_conc_n_threads++;
1200
		trx->declared_to_be_inside_innodb = TRUE;
1201
		trx->n_tickets_to_enter_innodb = 0;
1202
1203
		os_fast_mutex_unlock(&srv_conc_mutex);
1204
1205
		return;
1206
	}
1207
1208
	/* Release possible search system latch this thread has */
1209
	if (trx->has_search_latch) {
1210
		trx_search_latch_release_if_reserved(trx);
1211
	}
1212
1213
	/* Add to the queue */
1214
	slot->reserved = TRUE;
1215
	slot->wait_ended = FALSE;
1216
1217
	UT_LIST_ADD_LAST(srv_conc_queue, srv_conc_queue, slot);
1218
1219
	os_event_reset(slot->event);
1220
1221
	srv_conc_n_waiting_threads++;
1222
1223
	os_fast_mutex_unlock(&srv_conc_mutex);
1224
1225
	/* Go to wait for the event; when a thread leaves InnoDB it will
1226
	release this thread */
1227
1228
	trx->op_info = "waiting in InnoDB queue";
1229
1230
	os_event_wait(slot->event);
1231
1232
	trx->op_info = "";
1233
1234
	os_fast_mutex_lock(&srv_conc_mutex);
1235
1236
	srv_conc_n_waiting_threads--;
1237
1238
	/* NOTE that the thread which released this thread already
1239
	incremented the thread counter on behalf of this thread */
1240
1241
	slot->reserved = FALSE;
1242
1243
	UT_LIST_REMOVE(srv_conc_queue, srv_conc_queue, slot);
1244
1245
	trx->declared_to_be_inside_innodb = TRUE;
1246
	trx->n_tickets_to_enter_innodb = SRV_FREE_TICKETS_TO_ENTER;
1247
1248
	os_fast_mutex_unlock(&srv_conc_mutex);
1249
}
1250
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1251
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1252
This lets a thread enter InnoDB regardless of the number of threads inside
1253
InnoDB. This must be called when a thread ends a lock wait. */
1254
UNIV_INTERN
1255
void
1256
srv_conc_force_enter_innodb(
1257
/*========================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1258
	trx_t*	trx)	/*!< in: transaction object associated with the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1259
			thread */
1260
{
1261
	if (UNIV_LIKELY(!srv_thread_concurrency)) {
1262
1263
		return;
1264
	}
1265
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1266
	ut_ad(srv_conc_n_threads >= 0);
1267
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1268
	os_fast_mutex_lock(&srv_conc_mutex);
1269
1270
	srv_conc_n_threads++;
1271
	trx->declared_to_be_inside_innodb = TRUE;
1272
	trx->n_tickets_to_enter_innodb = 1;
1273
1274
	os_fast_mutex_unlock(&srv_conc_mutex);
1275
}
1276
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1277
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1278
This must be called when a thread exits InnoDB in a lock wait or at the
1279
end of an SQL statement. */
1280
UNIV_INTERN
1281
void
1282
srv_conc_force_exit_innodb(
1283
/*=======================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1284
	trx_t*	trx)	/*!< in: transaction object associated with the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1285
			thread */
1286
{
1287
	srv_conc_slot_t*	slot	= NULL;
1288
1289
	if (trx->mysql_thd != NULL
1290
	    && thd_is_replication_slave_thread(trx->mysql_thd)) {
1291
1292
		return;
1293
	}
1294
1295
	if (trx->declared_to_be_inside_innodb == FALSE) {
1296
1297
		return;
1298
	}
1299
1300
	os_fast_mutex_lock(&srv_conc_mutex);
1301
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1302
	ut_ad(srv_conc_n_threads > 0);
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1303
	srv_conc_n_threads--;
1304
	trx->declared_to_be_inside_innodb = FALSE;
1305
	trx->n_tickets_to_enter_innodb = 0;
1306
1307
	if (srv_conc_n_threads < (lint)srv_thread_concurrency) {
1308
		/* Look for a slot where a thread is waiting and no other
1309
		thread has yet released the thread */
1310
1311
		slot = UT_LIST_GET_FIRST(srv_conc_queue);
1312
1313
		while (slot && slot->wait_ended == TRUE) {
1314
			slot = UT_LIST_GET_NEXT(srv_conc_queue, slot);
1315
		}
1316
1317
		if (slot != NULL) {
1318
			slot->wait_ended = TRUE;
1319
1320
			/* We increment the count on behalf of the released
1321
			thread */
1322
1323
			srv_conc_n_threads++;
1324
		}
1325
	}
1326
1327
	os_fast_mutex_unlock(&srv_conc_mutex);
1328
1329
	if (slot != NULL) {
1330
		os_event_set(slot->event);
1331
	}
1332
}
1333
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1334
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1335
This must be called when a thread exits InnoDB. */
1336
UNIV_INTERN
1337
void
1338
srv_conc_exit_innodb(
1339
/*=================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1340
	trx_t*	trx)	/*!< in: transaction object associated with the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1341
			thread */
1342
{
1343
	if (trx->n_tickets_to_enter_innodb > 0) {
1344
		/* We will pretend the thread is still inside InnoDB though it
1345
		now leaves the InnoDB engine. In this way we save
1346
		a lot of semaphore operations. srv_conc_force_exit_innodb is
1347
		used to declare the thread definitely outside InnoDB. It
1348
		should be called when there is a lock wait or an SQL statement
1349
		ends. */
1350
1351
		return;
1352
	}
1353
1354
	srv_conc_force_exit_innodb(trx);
1355
}
1356
1357
/*========================================================================*/
1358
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1359
/*********************************************************************//**
1360
Normalizes init parameter values to use units we use inside InnoDB.
1361
@return	DB_SUCCESS or error code */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1362
static
1363
ulint
1364
srv_normalize_init_values(void)
1365
/*===========================*/
1366
{
1367
	ulint	n;
1368
	ulint	i;
1369
1370
	n = srv_n_data_files;
1371
1372
	for (i = 0; i < n; i++) {
1373
		srv_data_file_sizes[i] = srv_data_file_sizes[i]
1374
			* ((1024 * 1024) / UNIV_PAGE_SIZE);
1375
	}
1376
1377
	srv_last_file_size_max = srv_last_file_size_max
1378
		* ((1024 * 1024) / UNIV_PAGE_SIZE);
1379
1380
	srv_log_file_size = srv_log_file_size / UNIV_PAGE_SIZE;
1381
1382
	srv_log_buffer_size = srv_log_buffer_size / UNIV_PAGE_SIZE;
1383
1384
	srv_lock_table_size = 5 * (srv_buf_pool_size / UNIV_PAGE_SIZE);
1385
1386
	return(DB_SUCCESS);
1387
}
1388
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1389
/*********************************************************************//**
1390
Boots the InnoDB server.
1391
@return	DB_SUCCESS or error code */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1392
UNIV_INTERN
1393
ulint
1394
srv_boot(void)
1395
/*==========*/
1396
{
1397
	ulint	err;
1398
1399
	/* Transform the init parameter values given by MySQL to
1400
	use units we use inside InnoDB: */
1401
1402
	err = srv_normalize_init_values();
1403
1404
	if (err != DB_SUCCESS) {
1405
		return(err);
1406
	}
1407
1408
	/* Initialize synchronization primitives, memory management, and thread
1409
	local storage */
1410
1411
	srv_general_init();
1412
1413
	/* Initialize this module */
1414
1415
	srv_init();
1416
1417
	return(DB_SUCCESS);
1418
}
1419
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1420
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1421
Reserves a slot in the thread table for the current MySQL OS thread.
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1422
NOTE! The kernel mutex has to be reserved by the caller!
1423
@return	reserved slot */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1424
static
1425
srv_slot_t*
1426
srv_table_reserve_slot_for_mysql(void)
1427
/*==================================*/
1428
{
1429
	srv_slot_t*	slot;
1430
	ulint		i;
1431
1432
	ut_ad(mutex_own(&kernel_mutex));
1433
1434
	i = 0;
1435
	slot = srv_mysql_table + i;
1436
1437
	while (slot->in_use) {
1438
		i++;
1439
1440
		if (i >= OS_THREAD_MAX_N) {
1441
1442
			ut_print_timestamp(stderr);
1443
1444
			fprintf(stderr,
1445
				"  InnoDB: There appear to be %lu MySQL"
1446
				" threads currently waiting\n"
1447
				"InnoDB: inside InnoDB, which is the"
1448
				" upper limit. Cannot continue operation.\n"
1449
				"InnoDB: We intentionally generate"
1450
				" a seg fault to print a stack trace\n"
1451
				"InnoDB: on Linux. But first we print"
1452
				" a list of waiting threads.\n", (ulong) i);
1453
1454
			for (i = 0; i < OS_THREAD_MAX_N; i++) {
1455
1456
				slot = srv_mysql_table + i;
1457
1458
				fprintf(stderr,
1459
					"Slot %lu: thread id %lu, type %lu,"
1460
					" in use %lu, susp %lu, time %lu\n",
1461
					(ulong) i,
1462
					(ulong) os_thread_pf(slot->id),
1463
					(ulong) slot->type,
1464
					(ulong) slot->in_use,
1465
					(ulong) slot->suspended,
1466
					(ulong) difftime(ut_time(),
1467
							 slot->suspend_time));
1468
			}
1469
1470
			ut_error;
1471
		}
1472
1473
		slot = srv_mysql_table + i;
1474
	}
1475
1476
	ut_a(slot->in_use == FALSE);
1477
1478
	slot->in_use = TRUE;
1479
	slot->id = os_thread_get_curr_id();
1480
	slot->handle = os_thread_get_curr();
1481
1482
	return(slot);
1483
}
1484
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1485
/***************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1486
Puts a MySQL OS thread to wait for a lock to be released. If an error
1487
occurs during the wait trx->error_state associated with thr is
1488
!= DB_SUCCESS when we return. DB_LOCK_WAIT_TIMEOUT and DB_DEADLOCK
1489
are possible errors. DB_DEADLOCK is returned if selective deadlock
1490
resolution chose this transaction as a victim. */
1491
UNIV_INTERN
1492
void
1493
srv_suspend_mysql_thread(
1494
/*=====================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1495
	que_thr_t*	thr)	/*!< in: query thread associated with the MySQL
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1496
				OS thread */
1497
{
1498
	srv_slot_t*	slot;
1499
	os_event_t	event;
1500
	double		wait_time;
1501
	trx_t*		trx;
1502
	ulint		had_dict_lock;
1503
	ibool		was_declared_inside_innodb	= FALSE;
1504
	ib_int64_t	start_time			= 0;
1505
	ib_int64_t	finish_time;
1506
	ulint		diff_time;
1507
	ulint		sec;
1508
	ulint		ms;
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
1509
	ulong		lock_wait_timeout;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1510
1511
	ut_ad(!mutex_own(&kernel_mutex));
1512
1513
	trx = thr_get_trx(thr);
1514
1515
	os_event_set(srv_lock_timeout_thread_event);
1516
1517
	mutex_enter(&kernel_mutex);
1518
1519
	trx->error_state = DB_SUCCESS;
1520
1521
	if (thr->state == QUE_THR_RUNNING) {
1522
1523
		ut_ad(thr->is_active == TRUE);
1524
1525
		/* The lock has already been released or this transaction
1526
		was chosen as a deadlock victim: no need to suspend */
1527
1528
		if (trx->was_chosen_as_deadlock_victim) {
1529
1530
			trx->error_state = DB_DEADLOCK;
1531
			trx->was_chosen_as_deadlock_victim = FALSE;
1532
		}
1533
1534
		mutex_exit(&kernel_mutex);
1535
1536
		return;
1537
	}
1538
1539
	ut_ad(thr->is_active == FALSE);
1540
1541
	slot = srv_table_reserve_slot_for_mysql();
1542
1543
	event = slot->event;
1544
1545
	slot->thr = thr;
1546
1547
	os_event_reset(event);
1548
1549
	slot->suspend_time = ut_time();
1550
1551
	if (thr->lock_state == QUE_THR_LOCK_ROW) {
1552
		srv_n_lock_wait_count++;
1553
		srv_n_lock_wait_current_count++;
1554
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
1555
		if (ut_usectime(&sec, &ms) == -1) {
1556
			start_time = -1;
1557
		} else {
1558
			start_time = (ib_int64_t) sec * 1000000 + ms;
1559
		}
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1560
	}
1561
	/* Wake the lock timeout monitor thread, if it is suspended */
1562
1563
	os_event_set(srv_lock_timeout_thread_event);
1564
1565
	mutex_exit(&kernel_mutex);
1566
1567
	if (trx->declared_to_be_inside_innodb) {
1568
1569
		was_declared_inside_innodb = TRUE;
1570
1571
		/* We must declare this OS thread to exit InnoDB, since a
1572
		possible other thread holding a lock which this thread waits
1573
		for must be allowed to enter, sooner or later */
1574
1575
		srv_conc_force_exit_innodb(trx);
1576
	}
1577
1578
	had_dict_lock = trx->dict_operation_lock_mode;
1579
1580
	switch (had_dict_lock) {
1581
	case RW_S_LATCH:
1582
		/* Release foreign key check latch */
1583
		row_mysql_unfreeze_data_dictionary(trx);
1584
		break;
1585
	case RW_X_LATCH:
1586
		/* Release fast index creation latch */
1587
		row_mysql_unlock_data_dictionary(trx);
1588
		break;
1589
	}
1590
1591
	ut_a(trx->dict_operation_lock_mode == 0);
1592
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1593
	/* Suspend this thread and wait for the event. */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1594
1595
	os_event_wait(event);
1596
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1597
	/* After resuming, reacquire the data dictionary latch if
1598
	necessary. */
1599
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1600
	switch (had_dict_lock) {
1601
	case RW_S_LATCH:
1602
		row_mysql_freeze_data_dictionary(trx);
1603
		break;
1604
	case RW_X_LATCH:
1605
		row_mysql_lock_data_dictionary(trx);
1606
		break;
1607
	}
1608
1609
	if (was_declared_inside_innodb) {
1610
1611
		/* Return back inside InnoDB */
1612
1613
		srv_conc_force_enter_innodb(trx);
1614
	}
1615
1616
	mutex_enter(&kernel_mutex);
1617
1618
	/* Release the slot for others to use */
1619
1620
	slot->in_use = FALSE;
1621
1622
	wait_time = ut_difftime(ut_time(), slot->suspend_time);
1623
1624
	if (thr->lock_state == QUE_THR_LOCK_ROW) {
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
1625
		if (ut_usectime(&sec, &ms) == -1) {
1626
			finish_time = -1;
1627
		} else {
1628
			finish_time = (ib_int64_t) sec * 1000000 + ms;
1629
		}
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1630
1631
		diff_time = (ulint) (finish_time - start_time);
1632
1633
		srv_n_lock_wait_current_count--;
1634
		srv_n_lock_wait_time = srv_n_lock_wait_time + diff_time;
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
1635
		if (diff_time > srv_n_lock_max_wait_time &&
1636
		    /* only update the variable if we successfully
1637
		    retrieved the start and finish times. See Bug#36819. */
1638
		    start_time != -1 && finish_time != -1) {
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1639
			srv_n_lock_max_wait_time = diff_time;
1640
		}
1641
	}
1642
1643
	if (trx->was_chosen_as_deadlock_victim) {
1644
1645
		trx->error_state = DB_DEADLOCK;
1646
		trx->was_chosen_as_deadlock_victim = FALSE;
1647
	}
1648
1649
	mutex_exit(&kernel_mutex);
1650
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
1651
	/* InnoDB system transactions (such as the purge, and
1652
	incomplete transactions that are being rolled back after crash
1653
	recovery) will use the global value of
1654
	innodb_lock_wait_timeout, because trx->mysql_thd == NULL. */
1655
	lock_wait_timeout = thd_lock_wait_timeout(trx->mysql_thd);
1656
1657
	if (lock_wait_timeout < 100000000
1658
	    && wait_time > (double) lock_wait_timeout) {
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1659
1660
		trx->error_state = DB_LOCK_WAIT_TIMEOUT;
1661
	}
1662
}
1663
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1664
/********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1665
Releases a MySQL OS thread waiting for a lock to be released, if the
1666
thread is already suspended. */
1667
UNIV_INTERN
1668
void
1669
srv_release_mysql_thread_if_suspended(
1670
/*==================================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1671
	que_thr_t*	thr)	/*!< in: query thread associated with the
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1672
				MySQL OS thread	 */
1673
{
1674
	srv_slot_t*	slot;
1675
	ulint		i;
1676
1677
	ut_ad(mutex_own(&kernel_mutex));
1678
1679
	for (i = 0; i < OS_THREAD_MAX_N; i++) {
1680
1681
		slot = srv_mysql_table + i;
1682
1683
		if (slot->in_use && slot->thr == thr) {
1684
			/* Found */
1685
1686
			os_event_set(slot->event);
1687
1688
			return;
1689
		}
1690
	}
1691
1692
	/* not found */
1693
}
1694
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1695
/******************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1696
Refreshes the values used to calculate per-second averages. */
1697
static
1698
void
1699
srv_refresh_innodb_monitor_stats(void)
1700
/*==================================*/
1701
{
1702
	mutex_enter(&srv_innodb_monitor_mutex);
1703
1704
	srv_last_monitor_time = time(NULL);
1705
1706
	os_aio_refresh_stats();
1707
1708
	btr_cur_n_sea_old = btr_cur_n_sea;
1709
	btr_cur_n_non_sea_old = btr_cur_n_non_sea;
1710
1711
	log_refresh_stats();
1712
1713
	buf_refresh_io_stats();
1714
1715
	srv_n_rows_inserted_old = srv_n_rows_inserted;
1716
	srv_n_rows_updated_old = srv_n_rows_updated;
1717
	srv_n_rows_deleted_old = srv_n_rows_deleted;
1718
	srv_n_rows_read_old = srv_n_rows_read;
1719
1720
	mutex_exit(&srv_innodb_monitor_mutex);
1721
}
1722
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1723
/******************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1724
Outputs to a file the output of the InnoDB Monitor. */
1725
UNIV_INTERN
1726
void
1727
srv_printf_innodb_monitor(
1728
/*======================*/
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1729
	FILE*	file,		/*!< in: output stream */
1730
	ulint*	trx_start,	/*!< out: file position of the start of
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1731
				the list of active transactions */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1732
	ulint*	trx_end)	/*!< out: file position of the end of
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1733
				the list of active transactions */
1734
{
1735
	double	time_elapsed;
1736
	time_t	current_time;
1737
	ulint	n_reserved;
1738
1739
	mutex_enter(&srv_innodb_monitor_mutex);
1740
1741
	current_time = time(NULL);
1742
1743
	/* We add 0.001 seconds to time_elapsed to prevent division
1744
	by zero if two users happen to call SHOW INNODB STATUS at the same
1745
	time */
1746
1747
	time_elapsed = difftime(current_time, srv_last_monitor_time)
1748
		+ 0.001;
1749
1750
	srv_last_monitor_time = time(NULL);
1751
1752
	fputs("\n=====================================\n", file);
1753
1754
	ut_print_timestamp(file);
1755
	fprintf(file,
1756
		" INNODB MONITOR OUTPUT\n"
1757
		"=====================================\n"
1758
		"Per second averages calculated from the last %lu seconds\n",
1759
		(ulong)time_elapsed);
1760
1761
	fputs("----------\n"
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1762
		"BACKGROUND THREAD\n"
1763
		"----------\n", file);
1764
	srv_print_master_thread_info(file);
1765
1766
	fputs("----------\n"
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1767
	      "SEMAPHORES\n"
1768
	      "----------\n", file);
1769
	sync_print(file);
1770
1771
	/* Conceptually, srv_innodb_monitor_mutex has a very high latching
1772
	order level in sync0sync.h, while dict_foreign_err_mutex has a very
1773
	low level 135. Therefore we can reserve the latter mutex here without
1774
	a danger of a deadlock of threads. */
1775
1776
	mutex_enter(&dict_foreign_err_mutex);
1777
1778
	if (ftell(dict_foreign_err_file) != 0L) {
1779
		fputs("------------------------\n"
1780
		      "LATEST FOREIGN KEY ERROR\n"
1781
		      "------------------------\n", file);
1782
		ut_copy_file(file, dict_foreign_err_file);
1783
	}
1784
1785
	mutex_exit(&dict_foreign_err_mutex);
1786
1787
	lock_print_info_summary(file);
1788
	if (trx_start) {
1789
		long	t = ftell(file);
1790
		if (t < 0) {
1791
			*trx_start = ULINT_UNDEFINED;
1792
		} else {
1793
			*trx_start = (ulint) t;
1794
		}
1795
	}
1796
	lock_print_info_all_transactions(file);
1797
	if (trx_end) {
1798
		long	t = ftell(file);
1799
		if (t < 0) {
1800
			*trx_end = ULINT_UNDEFINED;
1801
		} else {
1802
			*trx_end = (ulint) t;
1803
		}
1804
	}
1805
	fputs("--------\n"
1806
	      "FILE I/O\n"
1807
	      "--------\n", file);
1808
	os_aio_print(file);
1809
1810
	fputs("-------------------------------------\n"
1811
	      "INSERT BUFFER AND ADAPTIVE HASH INDEX\n"
1812
	      "-------------------------------------\n", file);
1813
	ibuf_print(file);
1814
1815
	ha_print_info(file, btr_search_sys->hash_index);
1816
1817
	fprintf(file,
1818
		"%.2f hash searches/s, %.2f non-hash searches/s\n",
1819
		(btr_cur_n_sea - btr_cur_n_sea_old)
1820
		/ time_elapsed,
1821
		(btr_cur_n_non_sea - btr_cur_n_non_sea_old)
1822
		/ time_elapsed);
1823
	btr_cur_n_sea_old = btr_cur_n_sea;
1824
	btr_cur_n_non_sea_old = btr_cur_n_non_sea;
1825
1826
	fputs("---\n"
1827
	      "LOG\n"
1828
	      "---\n", file);
1829
	log_print(file);
1830
1831
	fputs("----------------------\n"
1832
	      "BUFFER POOL AND MEMORY\n"
1833
	      "----------------------\n", file);
1834
	fprintf(file,
1835
		"Total memory allocated " ULINTPF
1836
		"; in additional pool allocated " ULINTPF "\n",
1837
		ut_total_allocated_memory,
1838
		mem_pool_get_reserved(mem_comm_pool));
1839
	fprintf(file, "Dictionary memory allocated " ULINTPF "\n",
1840
		dict_sys->size);
1841
1842
	buf_print_io(file);
1843
1844
	fputs("--------------\n"
1845
	      "ROW OPERATIONS\n"
1846
	      "--------------\n", file);
1847
	fprintf(file, "%ld queries inside InnoDB, %lu queries in queue\n",
1848
		(long) srv_conc_n_threads,
1849
		(ulong) srv_conc_n_waiting_threads);
1850
1851
	fprintf(file, "%lu read views open inside InnoDB\n",
1852
		UT_LIST_GET_LEN(trx_sys->view_list));
1853
1854
	n_reserved = fil_space_get_n_reserved_extents(0);
1855
	if (n_reserved > 0) {
1856
		fprintf(file,
1857
			"%lu tablespace extents now reserved for"
1858
			" B-tree split operations\n",
1859
			(ulong) n_reserved);
1860
	}
1861
1862
#ifdef UNIV_LINUX
1863
	fprintf(file, "Main thread process no. %lu, id %lu, state: %s\n",
1864
		(ulong) srv_main_thread_process_no,
1865
		(ulong) srv_main_thread_id,
1866
		srv_main_thread_op_info);
1867
#else
1868
	fprintf(file, "Main thread id %lu, state: %s\n",
1869
		(ulong) srv_main_thread_id,
1870
		srv_main_thread_op_info);
1871
#endif
1872
	fprintf(file,
1873
		"Number of rows inserted " ULINTPF
1874
		", updated " ULINTPF ", deleted " ULINTPF
1875
		", read " ULINTPF "\n",
1876
		srv_n_rows_inserted,
1877
		srv_n_rows_updated,
1878
		srv_n_rows_deleted,
1879
		srv_n_rows_read);
1880
	fprintf(file,
1881
		"%.2f inserts/s, %.2f updates/s,"
1882
		" %.2f deletes/s, %.2f reads/s\n",
1883
		(srv_n_rows_inserted - srv_n_rows_inserted_old)
1884
		/ time_elapsed,
1885
		(srv_n_rows_updated - srv_n_rows_updated_old)
1886
		/ time_elapsed,
1887
		(srv_n_rows_deleted - srv_n_rows_deleted_old)
1888
		/ time_elapsed,
1889
		(srv_n_rows_read - srv_n_rows_read_old)
1890
		/ time_elapsed);
1891
1892
	srv_n_rows_inserted_old = srv_n_rows_inserted;
1893
	srv_n_rows_updated_old = srv_n_rows_updated;
1894
	srv_n_rows_deleted_old = srv_n_rows_deleted;
1895
	srv_n_rows_read_old = srv_n_rows_read;
1896
1897
	fputs("----------------------------\n"
1898
	      "END OF INNODB MONITOR OUTPUT\n"
1899
	      "============================\n", file);
1900
	mutex_exit(&srv_innodb_monitor_mutex);
1901
	fflush(file);
1902
}
1903
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1904
/******************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1905
Function to pass InnoDB status variables to MySQL */
1906
UNIV_INTERN
1907
void
1908
srv_export_innodb_status(void)
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1909
/*==========================*/
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1910
{
1911
	mutex_enter(&srv_innodb_monitor_mutex);
1912
1913
	export_vars.innodb_data_pending_reads
1914
		= os_n_pending_reads;
1915
	export_vars.innodb_data_pending_writes
1916
		= os_n_pending_writes;
1917
	export_vars.innodb_data_pending_fsyncs
1918
		= fil_n_pending_log_flushes
1919
		+ fil_n_pending_tablespace_flushes;
1920
	export_vars.innodb_data_fsyncs = os_n_fsyncs;
1921
	export_vars.innodb_data_read = srv_data_read;
1922
	export_vars.innodb_data_reads = os_n_file_reads;
1923
	export_vars.innodb_data_writes = os_n_file_writes;
1924
	export_vars.innodb_data_written = srv_data_written;
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
1925
	export_vars.innodb_buffer_pool_read_requests = buf_pool->stat.n_page_gets;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1926
	export_vars.innodb_buffer_pool_write_requests
1927
		= srv_buf_pool_write_requests;
1928
	export_vars.innodb_buffer_pool_wait_free = srv_buf_pool_wait_free;
1929
	export_vars.innodb_buffer_pool_pages_flushed = srv_buf_pool_flushed;
1930
	export_vars.innodb_buffer_pool_reads = srv_buf_pool_reads;
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
1931
	export_vars.innodb_buffer_pool_read_ahead
1932
		= buf_pool->stat.n_ra_pages_read;
1933
	export_vars.innodb_buffer_pool_read_ahead_evicted
1934
		= buf_pool->stat.n_ra_pages_evicted;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1935
	export_vars.innodb_buffer_pool_pages_data
1936
		= UT_LIST_GET_LEN(buf_pool->LRU);
1937
	export_vars.innodb_buffer_pool_pages_dirty
1938
		= UT_LIST_GET_LEN(buf_pool->flush_list);
1939
	export_vars.innodb_buffer_pool_pages_free
1940
		= UT_LIST_GET_LEN(buf_pool->free);
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
1941
#ifdef UNIV_DEBUG
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1942
	export_vars.innodb_buffer_pool_pages_latched
1943
		= buf_get_latched_pages_number();
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
1944
#endif /* UNIV_DEBUG */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1945
	export_vars.innodb_buffer_pool_pages_total = buf_pool->curr_size;
1946
1947
	export_vars.innodb_buffer_pool_pages_misc = buf_pool->curr_size
1948
		- UT_LIST_GET_LEN(buf_pool->LRU)
1949
		- UT_LIST_GET_LEN(buf_pool->free);
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1950
#ifdef HAVE_ATOMIC_BUILTINS
641.2.2 by Monty Taylor
InnoDB Plugin 1.0.3
1951
	export_vars.innodb_have_atomic_builtins = 1;
1952
#else
1953
	export_vars.innodb_have_atomic_builtins = 0;
1954
#endif
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1955
	export_vars.innodb_page_size = UNIV_PAGE_SIZE;
1956
	export_vars.innodb_log_waits = srv_log_waits;
1957
	export_vars.innodb_os_log_written = srv_os_log_written;
1958
	export_vars.innodb_os_log_fsyncs = fil_n_log_flushes;
1959
	export_vars.innodb_os_log_pending_fsyncs = fil_n_pending_log_flushes;
1960
	export_vars.innodb_os_log_pending_writes = srv_os_log_pending_writes;
1961
	export_vars.innodb_log_write_requests = srv_log_write_requests;
1962
	export_vars.innodb_log_writes = srv_log_writes;
1963
	export_vars.innodb_dblwr_pages_written = srv_dblwr_pages_written;
1964
	export_vars.innodb_dblwr_writes = srv_dblwr_writes;
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
1965
	export_vars.innodb_pages_created = buf_pool->stat.n_pages_created;
1966
	export_vars.innodb_pages_read = buf_pool->stat.n_pages_read;
1967
	export_vars.innodb_pages_written = buf_pool->stat.n_pages_written;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1968
	export_vars.innodb_row_lock_waits = srv_n_lock_wait_count;
1969
	export_vars.innodb_row_lock_current_waits
1970
		= srv_n_lock_wait_current_count;
1971
	export_vars.innodb_row_lock_time = srv_n_lock_wait_time / 1000;
1972
	if (srv_n_lock_wait_count > 0) {
1973
		export_vars.innodb_row_lock_time_avg = (ulint)
1974
			(srv_n_lock_wait_time / 1000 / srv_n_lock_wait_count);
1975
	} else {
1976
		export_vars.innodb_row_lock_time_avg = 0;
1977
	}
1978
	export_vars.innodb_row_lock_time_max
1979
		= srv_n_lock_max_wait_time / 1000;
1980
	export_vars.innodb_rows_read = srv_n_rows_read;
1981
	export_vars.innodb_rows_inserted = srv_n_rows_inserted;
1982
	export_vars.innodb_rows_updated = srv_n_rows_updated;
1983
	export_vars.innodb_rows_deleted = srv_n_rows_deleted;
1984
1985
	mutex_exit(&srv_innodb_monitor_mutex);
1986
}
1987
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1988
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1989
A thread which wakes up threads whose lock wait may have lasted too long.
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1990
This also prints the info output by various InnoDB monitors.
1991
@return	a dummy parameter */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1992
UNIV_INTERN
1993
os_thread_ret_t
1994
srv_lock_timeout_and_monitor_thread(
1995
/*================================*/
1996
	void*	arg __attribute__((unused)))
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
1997
			/*!< in: a dummy parameter required by
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
1998
			os_thread_create */
1999
{
2000
	srv_slot_t*	slot;
2001
	double		time_elapsed;
2002
	time_t		current_time;
2003
	time_t		last_table_monitor_time;
2004
	time_t		last_tablespace_monitor_time;
2005
	time_t		last_monitor_time;
2006
	ibool		some_waits;
2007
	double		wait_time;
2008
	ulint		i;
2009
2010
#ifdef UNIV_DEBUG_THREAD_CREATION
2011
	fprintf(stderr, "Lock timeout thread starts, id %lu\n",
2012
		os_thread_pf(os_thread_get_curr_id()));
2013
#endif
2014
	UT_NOT_USED(arg);
2015
	srv_last_monitor_time = time(NULL);
2016
	last_table_monitor_time = time(NULL);
2017
	last_tablespace_monitor_time = time(NULL);
2018
	last_monitor_time = time(NULL);
2019
loop:
2020
	srv_lock_timeout_and_monitor_active = TRUE;
2021
2022
	/* When someone is waiting for a lock, we wake up every second
2023
	and check if a timeout has passed for a lock wait */
2024
2025
	os_thread_sleep(1000000);
2026
2027
	current_time = time(NULL);
2028
2029
	time_elapsed = difftime(current_time, last_monitor_time);
2030
2031
	if (time_elapsed > 15) {
2032
		last_monitor_time = time(NULL);
2033
2034
		if (srv_print_innodb_monitor) {
2035
			srv_printf_innodb_monitor(stderr, NULL, NULL);
2036
		}
2037
2038
		if (srv_innodb_status) {
2039
			mutex_enter(&srv_monitor_file_mutex);
2040
			rewind(srv_monitor_file);
2041
			srv_printf_innodb_monitor(srv_monitor_file, NULL,
2042
						  NULL);
2043
			os_file_set_eof(srv_monitor_file);
2044
			mutex_exit(&srv_monitor_file_mutex);
2045
		}
2046
2047
		if (srv_print_innodb_tablespace_monitor
2048
		    && difftime(current_time,
2049
				last_tablespace_monitor_time) > 60) {
2050
			last_tablespace_monitor_time = time(NULL);
2051
2052
			fputs("========================"
2053
			      "========================\n",
2054
			      stderr);
2055
2056
			ut_print_timestamp(stderr);
2057
2058
			fputs(" INNODB TABLESPACE MONITOR OUTPUT\n"
2059
			      "========================"
2060
			      "========================\n",
2061
			      stderr);
2062
2063
			fsp_print(0);
2064
			fputs("Validating tablespace\n", stderr);
2065
			fsp_validate(0);
2066
			fputs("Validation ok\n"
2067
			      "---------------------------------------\n"
2068
			      "END OF INNODB TABLESPACE MONITOR OUTPUT\n"
2069
			      "=======================================\n",
2070
			      stderr);
2071
		}
2072
2073
		if (srv_print_innodb_table_monitor
2074
		    && difftime(current_time, last_table_monitor_time) > 60) {
2075
2076
			last_table_monitor_time = time(NULL);
2077
2078
			fputs("===========================================\n",
2079
			      stderr);
2080
2081
			ut_print_timestamp(stderr);
2082
2083
			fputs(" INNODB TABLE MONITOR OUTPUT\n"
2084
			      "===========================================\n",
2085
			      stderr);
2086
			dict_print();
2087
2088
			fputs("-----------------------------------\n"
2089
			      "END OF INNODB TABLE MONITOR OUTPUT\n"
2090
			      "==================================\n",
2091
			      stderr);
2092
		}
2093
	}
2094
2095
	mutex_enter(&kernel_mutex);
2096
2097
	some_waits = FALSE;
2098
2099
	/* Check of all slots if a thread is waiting there, and if it
2100
	has exceeded the time limit */
2101
2102
	for (i = 0; i < OS_THREAD_MAX_N; i++) {
2103
2104
		slot = srv_mysql_table + i;
2105
2106
		if (slot->in_use) {
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
2107
			trx_t*	trx;
2108
			ulong	lock_wait_timeout;
2109
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2110
			some_waits = TRUE;
2111
2112
			wait_time = ut_difftime(ut_time(), slot->suspend_time);
2113
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
2114
			trx = thr_get_trx(slot->thr);
2115
			lock_wait_timeout = thd_lock_wait_timeout(
2116
				trx->mysql_thd);
2117
2118
			if (lock_wait_timeout < 100000000
2119
			    && (wait_time > (double) lock_wait_timeout
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2120
				|| wait_time < 0)) {
2121
2122
				/* Timeout exceeded or a wrap-around in system
2123
				time counter: cancel the lock request queued
2124
				by the transaction and release possible
2125
				other transactions waiting behind; it is
2126
				possible that the lock has already been
2127
				granted: in that case do nothing */
2128
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
2129
				if (trx->wait_lock) {
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2130
					lock_cancel_waiting_and_release(
641.2.1 by Monty Taylor
InnoDB Plugin 1.0.2
2131
						trx->wait_lock);
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2132
				}
2133
			}
2134
		}
2135
	}
2136
2137
	os_event_reset(srv_lock_timeout_thread_event);
2138
2139
	mutex_exit(&kernel_mutex);
2140
2141
	if (srv_shutdown_state >= SRV_SHUTDOWN_CLEANUP) {
2142
		goto exit_func;
2143
	}
2144
2145
	if (some_waits || srv_print_innodb_monitor
2146
	    || srv_print_innodb_lock_monitor
2147
	    || srv_print_innodb_tablespace_monitor
2148
	    || srv_print_innodb_table_monitor) {
2149
		goto loop;
2150
	}
2151
2152
	/* No one was waiting for a lock and no monitor was active:
2153
	suspend this thread */
2154
2155
	srv_lock_timeout_and_monitor_active = FALSE;
2156
2157
#if 0
2158
	/* The following synchronisation is disabled, since
2159
	the InnoDB monitor output is to be updated every 15 seconds. */
2160
	os_event_wait(srv_lock_timeout_thread_event);
2161
#endif
2162
	goto loop;
2163
2164
exit_func:
2165
	srv_lock_timeout_and_monitor_active = FALSE;
2166
2167
	/* We count the number of threads in os_thread_exit(). A created
2168
	thread should always use that to exit and not use return() to exit. */
2169
2170
	os_thread_exit(NULL);
2171
2172
	OS_THREAD_DUMMY_RETURN;
2173
}
2174
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2175
/*********************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2176
A thread which prints warnings about semaphore waits which have lasted
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2177
too long. These can be used to track bugs which cause hangs.
2178
@return	a dummy parameter */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2179
UNIV_INTERN
2180
os_thread_ret_t
2181
srv_error_monitor_thread(
2182
/*=====================*/
2183
	void*	arg __attribute__((unused)))
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2184
			/*!< in: a dummy parameter required by
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2185
			os_thread_create */
2186
{
2187
	/* number of successive fatal timeouts observed */
2188
	ulint		fatal_cnt	= 0;
2189
	ib_uint64_t	old_lsn;
2190
	ib_uint64_t	new_lsn;
2191
2192
	old_lsn = srv_start_lsn;
2193
2194
#ifdef UNIV_DEBUG_THREAD_CREATION
2195
	fprintf(stderr, "Error monitor thread starts, id %lu\n",
2196
		os_thread_pf(os_thread_get_curr_id()));
2197
#endif
2198
loop:
2199
	srv_error_monitor_active = TRUE;
2200
2201
	/* Try to track a strange bug reported by Harald Fuchs and others,
2202
	where the lsn seems to decrease at times */
2203
2204
	new_lsn = log_get_lsn();
2205
2206
	if (new_lsn < old_lsn) {
2207
		ut_print_timestamp(stderr);
2208
		fprintf(stderr,
641.1.4 by Monty Taylor
Merged in InnoDB changes.
2209
			"  InnoDB: Error: old log sequence number %"PRIu64""
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2210
			" was greater\n"
641.1.4 by Monty Taylor
Merged in InnoDB changes.
2211
			"InnoDB: than the new log sequence number %"PRIu64"!\n"
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2212
			"InnoDB: Please submit a bug report"
2213
			" to http://bugs.mysql.com\n",
2214
			old_lsn, new_lsn);
2215
	}
2216
2217
	old_lsn = new_lsn;
2218
2219
	if (difftime(time(NULL), srv_last_monitor_time) > 60) {
2220
		/* We referesh InnoDB Monitor values so that averages are
2221
		printed from at most 60 last seconds */
2222
2223
		srv_refresh_innodb_monitor_stats();
2224
	}
2225
2226
	/* Update the statistics collected for deciding LRU
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2227
	eviction policy. */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2228
	buf_LRU_stat_update();
2229
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2230
	/* Update the statistics collected for flush rate policy. */
2231
	buf_flush_stat_update();
2232
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2233
	/* In case mutex_exit is not a memory barrier, it is
2234
	theoretically possible some threads are left waiting though
2235
	the semaphore is already released. Wake up those threads: */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2236
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2237
	sync_arr_wake_threads_if_sema_free();
2238
2239
	if (sync_array_print_long_waits()) {
2240
		fatal_cnt++;
2241
		if (fatal_cnt > 10) {
2242
2243
			fprintf(stderr,
2244
				"InnoDB: Error: semaphore wait has lasted"
2245
				" > %lu seconds\n"
2246
				"InnoDB: We intentionally crash the server,"
2247
				" because it appears to be hung.\n",
2248
				(ulong) srv_fatal_semaphore_wait_threshold);
2249
2250
			ut_error;
2251
		}
2252
	} else {
2253
		fatal_cnt = 0;
2254
	}
2255
2256
	/* Flush stderr so that a database user gets the output
2257
	to possible MySQL error file */
2258
2259
	fflush(stderr);
2260
2261
	os_thread_sleep(1000000);
2262
2263
	if (srv_shutdown_state < SRV_SHUTDOWN_CLEANUP) {
2264
2265
		goto loop;
2266
	}
2267
2268
	srv_error_monitor_active = FALSE;
2269
2270
	/* We count the number of threads in os_thread_exit(). A created
2271
	thread should always use that to exit and not use return() to exit. */
2272
2273
	os_thread_exit(NULL);
2274
2275
	OS_THREAD_DUMMY_RETURN;
2276
}
2277
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2278
/*******************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2279
Tells the InnoDB server that there has been activity in the database
2280
and wakes up the master thread if it is suspended (not sleeping). Used
2281
in the MySQL interface. Note that there is a small chance that the master
2282
thread stays suspended (we do not protect our operation with the kernel
2283
mutex, for performace reasons). */
2284
UNIV_INTERN
2285
void
2286
srv_active_wake_master_thread(void)
2287
/*===============================*/
2288
{
2289
	srv_activity_count++;
2290
2291
	if (srv_n_threads_active[SRV_MASTER] == 0) {
2292
2293
		mutex_enter(&kernel_mutex);
2294
2295
		srv_release_threads(SRV_MASTER, 1);
2296
2297
		mutex_exit(&kernel_mutex);
2298
	}
2299
}
2300
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2301
/*******************************************************************//**
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2302
Wakes up the master thread if it is suspended or being suspended. */
2303
UNIV_INTERN
2304
void
2305
srv_wake_master_thread(void)
2306
/*========================*/
2307
{
2308
	srv_activity_count++;
2309
2310
	mutex_enter(&kernel_mutex);
2311
2312
	srv_release_threads(SRV_MASTER, 1);
2313
2314
	mutex_exit(&kernel_mutex);
2315
}
2316
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2317
/**********************************************************************
2318
The master thread is tasked to ensure that flush of log file happens
2319
once every second in the background. This is to ensure that not more
2320
than one second of trxs are lost in case of crash when
2321
innodb_flush_logs_at_trx_commit != 1 */
2322
static
2323
void
2324
srv_sync_log_buffer_in_background(void)
2325
/*===================================*/
2326
{
2327
	time_t	current_time = time(NULL);
2328
2329
	srv_main_thread_op_info = "flushing log";
2330
	if (difftime(current_time, srv_last_log_flush_time) >= 1) {
2331
		log_buffer_sync_in_background(TRUE);
2332
		srv_last_log_flush_time = current_time;
2333
		srv_log_writes_and_flush++;
2334
	}
2335
}
2336
2337
/*********************************************************************//**
2338
The master thread controlling the server.
2339
@return	a dummy parameter */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2340
UNIV_INTERN
2341
os_thread_ret_t
2342
srv_master_thread(
2343
/*==============*/
2344
	void*	arg __attribute__((unused)))
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2345
			/*!< in: a dummy parameter required by
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2346
			os_thread_create */
2347
{
2348
	os_event_t	event;
2349
	ulint		old_activity_count;
2350
	ulint		n_pages_purged	= 0;
2351
	ulint		n_bytes_merged;
2352
	ulint		n_pages_flushed;
2353
	ulint		n_bytes_archived;
2354
	ulint		n_tables_to_drop;
2355
	ulint		n_ios;
2356
	ulint		n_ios_old;
2357
	ulint		n_ios_very_old;
2358
	ulint		n_pend_ios;
2359
	ibool		skip_sleep	= FALSE;
2360
	ulint		i;
2361
2362
#ifdef UNIV_DEBUG_THREAD_CREATION
2363
	fprintf(stderr, "Master thread starts, id %lu\n",
2364
		os_thread_pf(os_thread_get_curr_id()));
2365
#endif
2366
	srv_main_thread_process_no = os_proc_get_number();
2367
	srv_main_thread_id = os_thread_pf(os_thread_get_curr_id());
2368
2369
	srv_table_reserve_slot(SRV_MASTER);
2370
2371
	mutex_enter(&kernel_mutex);
2372
2373
	srv_n_threads_active[SRV_MASTER]++;
2374
2375
	mutex_exit(&kernel_mutex);
2376
2377
loop:
2378
	/*****************************************************************/
2379
	/* ---- When there is database activity by users, we cycle in this
2380
	loop */
2381
2382
	srv_main_thread_op_info = "reserving kernel mutex";
2383
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
2384
	n_ios_very_old = log_sys->n_log_ios + buf_pool->stat.n_pages_read
2385
		+ buf_pool->stat.n_pages_written;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2386
	mutex_enter(&kernel_mutex);
2387
2388
	/* Store the user activity counter at the start of this loop */
2389
	old_activity_count = srv_activity_count;
2390
2391
	mutex_exit(&kernel_mutex);
2392
2393
	if (srv_force_recovery >= SRV_FORCE_NO_BACKGROUND) {
2394
2395
		goto suspend_thread;
2396
	}
2397
2398
	/* ---- We run the following loop approximately once per second
2399
	when there is database activity */
2400
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2401
	srv_last_log_flush_time = time(NULL);
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2402
	skip_sleep = FALSE;
2403
2404
	for (i = 0; i < 10; i++) {
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
2405
		n_ios_old = log_sys->n_log_ios + buf_pool->stat.n_pages_read
2406
			+ buf_pool->stat.n_pages_written;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2407
		srv_main_thread_op_info = "sleeping";
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2408
		srv_main_1_second_loops++;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2409
2410
		if (!skip_sleep) {
2411
2412
			os_thread_sleep(1000000);
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2413
			srv_main_sleeps++;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2414
		}
2415
2416
		skip_sleep = FALSE;
2417
2418
		/* ALTER TABLE in MySQL requires on Unix that the table handler
2419
		can drop tables lazily after there no longer are SELECT
2420
		queries to them. */
2421
2422
		srv_main_thread_op_info = "doing background drop tables";
2423
2424
		row_drop_tables_for_mysql_in_background();
2425
2426
		srv_main_thread_op_info = "";
2427
2428
		if (srv_fast_shutdown && srv_shutdown_state > 0) {
2429
2430
			goto background_loop;
2431
		}
2432
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2433
		/* Flush logs if needed */
2434
		srv_sync_log_buffer_in_background();
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2435
2436
		srv_main_thread_op_info = "making checkpoint";
2437
		log_free_check();
2438
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2439
		/* If i/os during one second sleep were less than 5% of
2440
                capacity, we assume that there is free disk i/o capacity
2441
                available, and it makes sense to do an insert buffer merge. */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2442
2443
		n_pend_ios = buf_get_n_pending_ios()
2444
			+ log_sys->n_pending_writes;
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
2445
		n_ios = log_sys->n_log_ios + buf_pool->stat.n_pages_read
2446
			+ buf_pool->stat.n_pages_written;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2447
		if (n_pend_ios < SRV_PEND_IO_THRESHOLD
2448
		    && (n_ios - n_ios_old < SRV_RECENT_IO_ACTIVITY)) {
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2449
			srv_main_thread_op_info = "doing insert buffer merge";
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2450
			ibuf_contract_for_n_pages(FALSE, PCT_IO(5));
2451
2452
			/* Flush logs if needed */
2453
			srv_sync_log_buffer_in_background();
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2454
		}
2455
2456
		if (UNIV_UNLIKELY(buf_get_modified_ratio_pct()
2457
				  > srv_max_buf_pool_modified_pct)) {
2458
2459
			/* Try to keep the number of modified pages in the
2460
			buffer pool under the limit wished by the user */
2461
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
2462
			srv_main_thread_op_info =
2463
				"flushing buffer pool pages";
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2464
			n_pages_flushed = buf_flush_batch(BUF_FLUSH_LIST,
2465
							  PCT_IO(100),
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2466
							  IB_ULONGLONG_MAX);
2467
2468
			/* If we had to do the flush, it may have taken
2469
			even more than 1 second, and also, there may be more
2470
			to flush. Do not sleep 1 second during the next
2471
			iteration of this loop. */
2472
2473
			skip_sleep = TRUE;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2474
		} else if (srv_adaptive_flushing) {
2475
2476
			/* Try to keep the rate of flushing of dirty
2477
			pages such that redo log generation does not
2478
			produce bursts of IO at checkpoint time. */
2479
			ulint n_flush = buf_flush_get_desired_flush_rate();
2480
2481
			if (n_flush) {
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
2482
				srv_main_thread_op_info =
2483
					"flushing buffer pool pages";
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2484
				n_flush = ut_min(PCT_IO(100), n_flush);
2485
				n_pages_flushed =
2486
					buf_flush_batch(
2487
						BUF_FLUSH_LIST,
2488
						n_flush,
2489
						IB_ULONGLONG_MAX);
2490
				skip_sleep = TRUE;
2491
			}
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2492
		}
2493
2494
		if (srv_activity_count == old_activity_count) {
2495
2496
			/* There is no user activity at the moment, go to
2497
			the background loop */
2498
2499
			goto background_loop;
2500
		}
2501
	}
2502
2503
	/* ---- We perform the following code approximately once per
2504
	10 seconds when there is database activity */
2505
2506
#ifdef MEM_PERIODIC_CHECK
2507
	/* Check magic numbers of every allocated mem block once in 10
2508
	seconds */
2509
	mem_validate_all_blocks();
2510
#endif
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2511
	/* If i/os during the 10 second period were less than 200% of
2512
	capacity, we assume that there is free disk i/o capacity
2513
	available, and it makes sense to flush srv_io_capacity pages.
2514
2515
	Note that this is done regardless of the fraction of dirty
2516
	pages relative to the max requested by the user. The one second
2517
	loop above requests writes for that case. The writes done here
2518
	are not required, and may be disabled. */
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2519
2520
	n_pend_ios = buf_get_n_pending_ios() + log_sys->n_pending_writes;
1819.5.19 by stewart at flamingspork
[patch 019/129] Merge patch for revision 1805 from InnoDB SVN:
2521
	n_ios = log_sys->n_log_ios + buf_pool->stat.n_pages_read
2522
		+ buf_pool->stat.n_pages_written;
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2523
2524
	srv_main_10_second_loops++;
2525
	if (n_pend_ios < SRV_PEND_IO_THRESHOLD
2526
	    && (n_ios - n_ios_very_old < SRV_PAST_IO_ACTIVITY)) {
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2527
2528
		srv_main_thread_op_info = "flushing buffer pool pages";
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2529
		buf_flush_batch(BUF_FLUSH_LIST, PCT_IO(100),
2530
				IB_ULONGLONG_MAX);
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2531
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2532
		/* Flush logs if needed */
2533
		srv_sync_log_buffer_in_background();
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2534
	}
2535
2536
	/* We run a batch of insert buffer merge every 10 seconds,
2537
	even if the server were active */
2538
2539
	srv_main_thread_op_info = "doing insert buffer merge";
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2540
	ibuf_contract_for_n_pages(FALSE, PCT_IO(5));
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2541
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2542
	/* Flush logs if needed */
2543
	srv_sync_log_buffer_in_background();
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2544
2545
	/* We run a full purge every 10 seconds, even if the server
2546
	were active */
2547
	do {
2548
2549
		if (srv_fast_shutdown && srv_shutdown_state > 0) {
2550
2551
			goto background_loop;
2552
		}
2553
2554
		srv_main_thread_op_info = "purging";
2555
		n_pages_purged = trx_purge();
2556
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2557
		/* Flush logs if needed */
2558
		srv_sync_log_buffer_in_background();
2559
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2560
	} while (n_pages_purged);
2561
2562
	srv_main_thread_op_info = "flushing buffer pool pages";
2563
2564
	/* Flush a few oldest pages to make a new checkpoint younger */
2565
2566
	if (buf_get_modified_ratio_pct() > 70) {
2567
2568
		/* If there are lots of modified pages in the buffer pool
2569
		(> 70 %), we assume we can afford reserving the disk(s) for
2570
		the time it requires to flush 100 pages */
2571
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2572
		n_pages_flushed = buf_flush_batch(BUF_FLUSH_LIST,
2573
						  PCT_IO(100),
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2574
						  IB_ULONGLONG_MAX);
2575
	} else {
2576
		/* Otherwise, we only flush a small number of pages so that
2577
		we do not unnecessarily use much disk i/o capacity from
2578
		other work */
2579
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2580
		n_pages_flushed = buf_flush_batch(BUF_FLUSH_LIST,
2581
						  PCT_IO(10),
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2582
						  IB_ULONGLONG_MAX);
2583
	}
2584
2585
	srv_main_thread_op_info = "making checkpoint";
2586
2587
	/* Make a new checkpoint about once in 10 seconds */
2588
2589
	log_checkpoint(TRUE, FALSE);
2590
2591
	srv_main_thread_op_info = "reserving kernel mutex";
2592
2593
	mutex_enter(&kernel_mutex);
2594
2595
	/* ---- When there is database activity, we jump from here back to
2596
	the start of loop */
2597
2598
	if (srv_activity_count != old_activity_count) {
2599
		mutex_exit(&kernel_mutex);
2600
		goto loop;
2601
	}
2602
2603
	mutex_exit(&kernel_mutex);
2604
2605
	/* If the database is quiet, we enter the background loop */
2606
2607
	/*****************************************************************/
2608
background_loop:
2609
	/* ---- In this loop we run background operations when the server
2610
	is quiet from user activity. Also in the case of a shutdown, we
2611
	loop here, flushing the buffer pool to the data files. */
2612
2613
	/* The server has been quiet for a while: start running background
2614
	operations */
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2615
	srv_main_background_loops++;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2616
	srv_main_thread_op_info = "doing background drop tables";
2617
2618
	n_tables_to_drop = row_drop_tables_for_mysql_in_background();
2619
2620
	if (n_tables_to_drop > 0) {
2621
		/* Do not monopolize the CPU even if there are tables waiting
2622
		in the background drop queue. (It is essentially a bug if
2623
		MySQL tries to drop a table while there are still open handles
2624
		to it and we had to put it to the background drop queue.) */
2625
2626
		os_thread_sleep(100000);
2627
	}
2628
2629
	srv_main_thread_op_info = "purging";
2630
2631
	/* Run a full purge */
2632
	do {
2633
		if (srv_fast_shutdown && srv_shutdown_state > 0) {
2634
2635
			break;
2636
		}
2637
2638
		srv_main_thread_op_info = "purging";
2639
		n_pages_purged = trx_purge();
2640
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2641
		/* Flush logs if needed */
2642
		srv_sync_log_buffer_in_background();
2643
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2644
	} while (n_pages_purged);
2645
2646
	srv_main_thread_op_info = "reserving kernel mutex";
2647
2648
	mutex_enter(&kernel_mutex);
2649
	if (srv_activity_count != old_activity_count) {
2650
		mutex_exit(&kernel_mutex);
2651
		goto loop;
2652
	}
2653
	mutex_exit(&kernel_mutex);
2654
2655
	srv_main_thread_op_info = "doing insert buffer merge";
2656
2657
	if (srv_fast_shutdown && srv_shutdown_state > 0) {
2658
		n_bytes_merged = 0;
2659
	} else {
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2660
		/* This should do an amount of IO similar to the number of
2661
		dirty pages that will be flushed in the call to
2662
		buf_flush_batch below. Otherwise, the system favors
2663
		clean pages over cleanup throughput. */
2664
		n_bytes_merged = ibuf_contract_for_n_pages(FALSE,
2665
							   PCT_IO(100));
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2666
	}
2667
2668
	srv_main_thread_op_info = "reserving kernel mutex";
2669
2670
	mutex_enter(&kernel_mutex);
2671
	if (srv_activity_count != old_activity_count) {
2672
		mutex_exit(&kernel_mutex);
2673
		goto loop;
2674
	}
2675
	mutex_exit(&kernel_mutex);
2676
2677
flush_loop:
2678
	srv_main_thread_op_info = "flushing buffer pool pages";
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2679
	srv_main_flush_loops++;
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2680
	if (srv_fast_shutdown < 2) {
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2681
		n_pages_flushed = buf_flush_batch(BUF_FLUSH_LIST,
2682
						  PCT_IO(100),
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2683
						  IB_ULONGLONG_MAX);
2684
	} else {
2685
		/* In the fastest shutdown we do not flush the buffer pool
2686
		to data files: we set n_pages_flushed to 0 artificially. */
2687
2688
		n_pages_flushed = 0;
2689
	}
2690
2691
	srv_main_thread_op_info = "reserving kernel mutex";
2692
2693
	mutex_enter(&kernel_mutex);
2694
	if (srv_activity_count != old_activity_count) {
2695
		mutex_exit(&kernel_mutex);
2696
		goto loop;
2697
	}
2698
	mutex_exit(&kernel_mutex);
2699
2700
	srv_main_thread_op_info = "waiting for buffer pool flush to end";
2701
	buf_flush_wait_batch_end(BUF_FLUSH_LIST);
2702
641.2.3 by Monty Taylor
InnoDB Plugin 1.0.4
2703
	/* Flush logs if needed */
2704
	srv_sync_log_buffer_in_background();
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2705
2706
	srv_main_thread_op_info = "making checkpoint";
2707
2708
	log_checkpoint(TRUE, FALSE);
2709
2710
	if (buf_get_modified_ratio_pct() > srv_max_buf_pool_modified_pct) {
2711
2712
		/* Try to keep the number of modified pages in the
2713
		buffer pool under the limit wished by the user */
2714
2715
		goto flush_loop;
2716
	}
2717
2718
	srv_main_thread_op_info = "reserving kernel mutex";
2719
2720
	mutex_enter(&kernel_mutex);
2721
	if (srv_activity_count != old_activity_count) {
2722
		mutex_exit(&kernel_mutex);
2723
		goto loop;
2724
	}
2725
	mutex_exit(&kernel_mutex);
2726
	/*
2727
	srv_main_thread_op_info = "archiving log (if log archive is on)";
2728
2729
	log_archive_do(FALSE, &n_bytes_archived);
2730
	*/
2731
	n_bytes_archived = 0;
2732
2733
	/* Keep looping in the background loop if still work to do */
2734
2735
	if (srv_fast_shutdown && srv_shutdown_state > 0) {
2736
		if (n_tables_to_drop + n_pages_flushed
2737
		    + n_bytes_archived != 0) {
2738
2739
			/* If we are doing a fast shutdown (= the default)
2740
			we do not do purge or insert buffer merge. But we
2741
			flush the buffer pool completely to disk.
2742
			In a 'very fast' shutdown we do not flush the buffer
2743
			pool to data files: we have set n_pages_flushed to
2744
			0 artificially. */
2745
2746
			goto background_loop;
2747
		}
2748
	} else if (n_tables_to_drop
2749
		   + n_pages_purged + n_bytes_merged + n_pages_flushed
2750
		   + n_bytes_archived != 0) {
2751
		/* In a 'slow' shutdown we run purge and the insert buffer
2752
		merge to completion */
2753
2754
		goto background_loop;
2755
	}
2756
2757
	/* There is no work for background operations either: suspend
2758
	master thread to wait for more server activity */
2759
2760
suspend_thread:
2761
	srv_main_thread_op_info = "suspending";
2762
2763
	mutex_enter(&kernel_mutex);
2764
2765
	if (row_get_background_drop_list_len_low() > 0) {
2766
		mutex_exit(&kernel_mutex);
2767
2768
		goto loop;
2769
	}
2770
2771
	event = srv_suspend_thread();
2772
2773
	mutex_exit(&kernel_mutex);
2774
2775
	/* DO NOT CHANGE THIS STRING. innobase_start_or_create_for_mysql()
2776
	waits for database activity to die down when converting < 4.1.x
2777
	databases, and relies on this string being exactly as it is. InnoDB
2778
	manual also mentions this string in several places. */
2779
	srv_main_thread_op_info = "waiting for server activity";
2780
2781
	os_event_wait(event);
2782
2783
	if (srv_shutdown_state == SRV_SHUTDOWN_EXIT_THREADS) {
2784
		/* This is only extra safety, the thread should exit
2785
		already when the event wait ends */
2786
2787
		os_thread_exit(NULL);
2788
	}
2789
2790
	/* When there is user activity, InnoDB will set the event and the
2791
	main thread goes back to loop. */
2792
2793
	goto loop;
2794
779.3.18 by Monty Taylor
Cleaned up warnings up through innodb.
2795
971.4.1 by Monty Taylor
GCC on Solaris build fixes.
2796
#if (!defined(__SUNPRO_C) && !defined(__SUNPRO_CC))
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2797
	OS_THREAD_DUMMY_RETURN;	/* Not reached, avoid compiler warning */
779.3.18 by Monty Taylor
Cleaned up warnings up through innodb.
2798
#endif
641.1.2 by Monty Taylor
Imported 1.0.1 with clean - with no changes.
2799
}