forked from mysql/mysql-server
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbinlog.h
934 lines (788 loc) · 33 KB
/
binlog.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
#ifndef BINLOG_H_INCLUDED
/* Copyright (c) 2010, 2018, Oracle and/or its affiliates. All rights reserved.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License, version 2.0,
as published by the Free Software Foundation.
This program is also distributed with certain software (including
but not limited to OpenSSL) that is licensed under separate terms,
as designated in a particular file or component or in included license
documentation. The authors of MySQL hereby grant you an additional
permission to link the program and your derivative works with the
separately licensed software that they have included with MySQL.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License, version 2.0, for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
#define BINLOG_H_INCLUDED
#include <string.h>
#include <sys/types.h>
#include <time.h>
#include <atomic>
#include <utility>
#include "binlog_event.h" // enum_binlog_checksum_alg
#include "m_string.h" // llstr
#include "my_dbug.h"
#include "my_inttypes.h"
#include "my_io.h"
#include "my_sharedlib.h"
#include "my_sys.h"
#include "mysql/components/services/mysql_cond_bits.h"
#include "mysql/components/services/mysql_mutex_bits.h"
#include "mysql/components/services/psi_cond_bits.h"
#include "mysql/components/services/psi_file_bits.h"
#include "mysql/components/services/psi_mutex_bits.h"
#include "mysql/psi/mysql_cond.h"
#include "mysql/psi/mysql_mutex.h"
#include "mysql/udf_registration_types.h"
#include "mysql_com.h" // Item_result
#include "sql/rpl_trx_tracking.h"
#include "sql/tc_log.h" // TC_LOG
#include "thr_mutex.h"
class Format_description_log_event;
class Gtid_monitoring_info;
class Gtid_set;
class Ha_trx_info;
class Incident_log_event;
class Log_event;
class Master_info;
class Relay_log_info;
class Rows_log_event;
class Sid_map;
class THD;
class Transaction_boundary_parser;
class binlog_cache_data;
class user_var_entry;
class Binlog_cache_storage;
struct Gtid;
typedef int64 query_id_t;
/*
Maximum unique log filename extension.
Note: setting to 0x7FFFFFFF due to atol windows
overflow/truncate.
*/
#define MAX_LOG_UNIQUE_FN_EXT 0x7FFFFFFF
struct Binlog_user_var_event {
user_var_entry *user_var_event;
char *value;
ulong length;
Item_result type;
uint charset_number;
bool unsigned_flag;
};
/**
Class for maintaining the commit stages for binary log group commit.
*/
class Stage_manager {
public:
class Mutex_queue {
friend class Stage_manager;
public:
Mutex_queue() : m_first(NULL), m_last(&m_first), m_size(0) {}
void init(PSI_mutex_key key_LOCK_queue) {
mysql_mutex_init(key_LOCK_queue, &m_lock, MY_MUTEX_INIT_FAST);
}
void deinit() { mysql_mutex_destroy(&m_lock); }
bool is_empty() const { return m_first == NULL; }
/**
Append a linked list of threads to the queue.
@retval true The queue was empty before this operation.
@retval false The queue was non-empty before this operation.
*/
bool append(THD *first);
/**
Fetch the entire queue for a stage.
This will fetch the entire queue in one go.
*/
THD *fetch_and_empty();
std::pair<bool, THD *> pop_front();
inline int32 get_size() { return m_size.load(); }
private:
void lock() { mysql_mutex_lock(&m_lock); }
void unlock() { mysql_mutex_unlock(&m_lock); }
/**
Pointer to the first thread in the queue, or NULL if the queue is
empty.
*/
THD *m_first;
/**
Pointer to the location holding the end of the queue.
This is either @c &first, or a pointer to the @c next_to_commit of
the last thread that is enqueued.
*/
THD **m_last;
/** size of the queue */
std::atomic<int32> m_size;
/** Lock for protecting the queue. */
mysql_mutex_t m_lock;
/*
This attribute did not have the desired effect, at least not according
to -fsanitize=undefined with gcc 5.2.1
*/
}; // MY_ATTRIBUTE((aligned(CPU_LEVEL1_DCACHE_LINESIZE)));
public:
Stage_manager() {}
~Stage_manager() {}
/**
Constants for queues for different stages.
*/
enum StageID { FLUSH_STAGE, SYNC_STAGE, COMMIT_STAGE, STAGE_COUNTER };
void init(PSI_mutex_key key_LOCK_flush_queue,
PSI_mutex_key key_LOCK_sync_queue,
PSI_mutex_key key_LOCK_commit_queue, PSI_mutex_key key_LOCK_done,
PSI_cond_key key_COND_done) {
mysql_mutex_init(key_LOCK_done, &m_lock_done, MY_MUTEX_INIT_FAST);
mysql_cond_init(key_COND_done, &m_cond_done);
#ifndef DBUG_OFF
/* reuse key_COND_done 'cos a new PSI object would be wasteful in !DBUG_OFF
*/
mysql_cond_init(key_COND_done, &m_cond_preempt);
#endif
m_queue[FLUSH_STAGE].init(key_LOCK_flush_queue);
m_queue[SYNC_STAGE].init(key_LOCK_sync_queue);
m_queue[COMMIT_STAGE].init(key_LOCK_commit_queue);
}
void deinit() {
for (size_t i = 0; i < STAGE_COUNTER; ++i) m_queue[i].deinit();
mysql_cond_destroy(&m_cond_done);
mysql_mutex_destroy(&m_lock_done);
}
/**
Enroll a set of sessions for a stage.
This will queue the session thread for writing and flushing.
If the thread being queued is assigned as stage leader, it will
return immediately.
If wait_if_follower is true the thread is not the stage leader,
the thread will be wait for the queue to be processed by the
leader before it returns.
In DBUG-ON version the follower marks is preempt status as ready.
@param stage Stage identifier for the queue to append to.
@param first Queue to append.
@param stage_mutex
Pointer to the currently held stage mutex, or NULL if
we're not in a stage.
@retval true Thread is stage leader.
@retval false Thread was not stage leader and processing has been done.
*/
bool enroll_for(StageID stage, THD *first, mysql_mutex_t *stage_mutex);
std::pair<bool, THD *> pop_front(StageID stage) {
return m_queue[stage].pop_front();
}
#ifndef DBUG_OFF
/**
The method ensures the follower's execution path can be preempted
by the leader's thread.
Preempt status of @c head follower is checked to engange the leader
into waiting when set.
@param head THD* of a follower thread
*/
void clear_preempt_status(THD *head);
#endif
/**
Fetch the entire queue and empty it.
@return Pointer to the first session of the queue.
*/
THD *fetch_queue_for(StageID stage) {
DBUG_PRINT("debug", ("Fetching queue for stage %d", stage));
return m_queue[stage].fetch_and_empty();
}
/**
Introduces a wait operation on the executing thread. The
waiting is done until the timeout elapses or count is
reached (whichever comes first).
If count == 0, then the session will wait until the timeout
elapses. If timeout == 0, then there is no waiting.
@param usec the number of microseconds to wait.
@param count wait for as many as count to join the queue the
session is waiting on
@param stage which stage queue size to compare count against.
*/
void wait_count_or_timeout(ulong count, long usec, StageID stage);
void signal_done(THD *queue);
private:
/**
Queues for sessions.
We need two queues:
- Waiting. Threads waiting to be processed
- Committing. Threads waiting to be committed.
*/
Mutex_queue m_queue[STAGE_COUNTER];
/** Condition variable to indicate that the commit was processed */
mysql_cond_t m_cond_done;
/** Mutex used for the condition variable above */
mysql_mutex_t m_lock_done;
#ifndef DBUG_OFF
/** Flag is set by Leader when it starts waiting for follower's all-clear */
bool leader_await_preempt_status;
/** Condition variable to indicate a follower started waiting for commit */
mysql_cond_t m_cond_preempt;
#endif
};
/* log info errors */
#define LOG_INFO_EOF -1
#define LOG_INFO_IO -2
#define LOG_INFO_INVALID -3
#define LOG_INFO_SEEK -4
#define LOG_INFO_MEM -6
#define LOG_INFO_FATAL -7
#define LOG_INFO_IN_USE -8
#define LOG_INFO_EMFILE -9
/* bitmap to MYSQL_BIN_LOG::close() */
#define LOG_CLOSE_INDEX 1
#define LOG_CLOSE_TO_BE_OPENED 2
#define LOG_CLOSE_STOP_EVENT 4
/*
Note that we destroy the lock mutex in the destructor here.
This means that object instances cannot be destroyed/go out of scope
until we have reset thd->current_linfo to NULL;
*/
struct LOG_INFO {
char log_file_name[FN_REFLEN];
my_off_t index_file_offset, index_file_start_offset;
my_off_t pos;
bool fatal; // if the purge happens to give us a negative offset
int entry_index; // used in purge_logs(), calculatd in find_log_pos().
LOG_INFO()
: index_file_offset(0),
index_file_start_offset(0),
pos(0),
fatal(0),
entry_index(0) {
memset(log_file_name, 0, FN_REFLEN);
}
};
/*
TODO use mmap instead of IO_CACHE for binlog
(mmap+fsync is two times faster than write+fsync)
*/
class MYSQL_BIN_LOG : public TC_LOG {
public:
class Binlog_ofile;
private:
enum enum_log_state { LOG_OPENED, LOG_CLOSED, LOG_TO_BE_OPENED };
/* LOCK_log is inited by init_pthread_objects() */
mysql_mutex_t LOCK_log;
char *name;
char log_file_name[FN_REFLEN];
char db[NAME_LEN + 1];
bool write_error, inited;
Binlog_ofile *m_binlog_file;
/** Instrumentation key to use for file io in @c log_file */
PSI_file_key m_log_file_key;
/** The instrumentation key to use for @ LOCK_log. */
PSI_mutex_key m_key_LOCK_log;
/** The instrumentation key to use for @ LOCK_index. */
PSI_mutex_key m_key_LOCK_index;
/** The instrumentation key to use for @ LOCK_binlog_end_pos. */
PSI_mutex_key m_key_LOCK_binlog_end_pos;
PSI_mutex_key m_key_COND_done;
PSI_mutex_key m_key_LOCK_commit_queue;
PSI_mutex_key m_key_LOCK_done;
PSI_mutex_key m_key_LOCK_flush_queue;
PSI_mutex_key m_key_LOCK_sync_queue;
/** The instrumentation key to use for @ LOCK_commit. */
PSI_mutex_key m_key_LOCK_commit;
/** The instrumentation key to use for @ LOCK_sync. */
PSI_mutex_key m_key_LOCK_sync;
/** The instrumentation key to use for @ LOCK_xids. */
PSI_mutex_key m_key_LOCK_xids;
/** The instrumentation key to use for @ update_cond. */
PSI_cond_key m_key_update_cond;
/** The instrumentation key to use for @ prep_xids_cond. */
PSI_cond_key m_key_prep_xids_cond;
/** The instrumentation key to use for opening the log file. */
PSI_file_key m_key_file_log;
/** The instrumentation key to use for opening the log index file. */
PSI_file_key m_key_file_log_index;
/** The instrumentation key to use for opening a log cache file. */
PSI_file_key m_key_file_log_cache;
/** The instrumentation key to use for opening a log index cache file. */
PSI_file_key m_key_file_log_index_cache;
/* POSIX thread objects are inited by init_pthread_objects() */
mysql_mutex_t LOCK_index;
mysql_mutex_t LOCK_commit;
mysql_mutex_t LOCK_sync;
mysql_mutex_t LOCK_binlog_end_pos;
mysql_mutex_t LOCK_xids;
mysql_cond_t update_cond;
std::atomic<my_off_t> atomic_binlog_end_pos;
ulonglong bytes_written;
IO_CACHE index_file;
char index_file_name[FN_REFLEN];
/*
crash_safe_index_file is temp file used for guaranteeing
index file crash safe when master server restarts.
*/
IO_CACHE crash_safe_index_file;
char crash_safe_index_file_name[FN_REFLEN];
/*
purge_file is a temp file used in purge_logs so that the index file
can be updated before deleting files from disk, yielding better crash
recovery. It is created on demand the first time purge_logs is called
and then reused for subsequent calls. It is cleaned up in cleanup().
*/
IO_CACHE purge_index_file;
char purge_index_file_name[FN_REFLEN];
/*
The max size before rotation (usable only if log_type == LOG_BIN: binary
logs and relay logs).
For a binlog, max_size should be max_binlog_size.
For a relay log, it should be max_relay_log_size if this is non-zero,
max_binlog_size otherwise.
max_size is set in init(), and dynamically changed (when one does SET
GLOBAL MAX_BINLOG_SIZE|MAX_RELAY_LOG_SIZE) by fix_max_binlog_size and
fix_max_relay_log_size).
*/
ulong max_size;
// current file sequence number for load data infile binary logging
uint file_id;
uint open_count; // For replication
/* pointer to the sync period variable, for binlog this will be
sync_binlog_period, for relay log this will be
sync_relay_log_period
*/
uint *sync_period_ptr;
uint sync_counter;
mysql_cond_t m_prep_xids_cond;
std::atomic<int32> m_atomic_prep_xids{0};
/**
Increment the prepared XID counter.
*/
void inc_prep_xids(THD *thd);
/**
Decrement the prepared XID counter.
Signal m_prep_xids_cond if the counter reaches zero.
*/
void dec_prep_xids(THD *thd);
int32 get_prep_xids() { return m_atomic_prep_xids; }
inline uint get_sync_period() { return *sync_period_ptr; }
public:
/*
This is used to start writing to a new log file. The difference from
new_file() is locking. new_file_without_locking() does not acquire
LOCK_log.
*/
int new_file_without_locking(
Format_description_log_event *extra_description_event);
private:
int new_file_impl(bool need_lock,
Format_description_log_event *extra_description_event);
/** Manage the stages in ordered_commit. */
Stage_manager stage_manager;
bool open(PSI_file_key log_file_key, const char *log_name,
const char *new_name, uint32 new_index_number);
bool init_and_set_log_file_name(const char *log_name, const char *new_name,
uint32 new_index_number);
int generate_new_name(char *new_name, const char *log_name,
uint32 new_index_number = 0);
public:
const char *generate_name(const char *log_name, const char *suffix,
char *buff);
bool is_open() { return atomic_log_state != LOG_CLOSED; }
/* This is relay log */
bool is_relay_log;
uint8 checksum_alg_reset; // to contain a new value when binlog is rotated
/*
Holds the last seen in Relay-Log FD's checksum alg value.
The initial value comes from the slave's local FD that heads
the very first Relay-Log file. In the following the value may change
with each received master's FD_m.
Besides to be used in verification events that IO thread receives
(except the 1st fake Rotate, see @c Master_info:: checksum_alg_before_fd),
the value specifies if/how to compute checksum for slave's local events
and the first fake Rotate (R_f^1) coming from the master.
R_f^1 needs logging checksum-compatibly with the RL's heading FD_s.
Legends for the checksum related comments:
FD - Format-Description event,
R - Rotate event
R_f - the fake Rotate event
E - an arbirary event
The underscore indexes for any event
`_s' indicates the event is generated by Slave
`_m' - by Master
Two special underscore indexes of FD:
FD_q - Format Description event for queuing (relay-logging)
FD_e - Format Description event for executing (relay-logging)
Upper indexes:
E^n - n:th event is a sequence
RL - Relay Log
(A) - checksum algorithm descriptor value
FD.(A) - the value of (A) in FD
*/
binary_log::enum_binlog_checksum_alg relay_log_checksum_alg;
MYSQL_BIN_LOG(uint *sync_period);
~MYSQL_BIN_LOG();
void set_psi_keys(
PSI_mutex_key key_LOCK_index, PSI_mutex_key key_LOCK_commit,
PSI_mutex_key key_LOCK_commit_queue, PSI_mutex_key key_LOCK_done,
PSI_mutex_key key_LOCK_flush_queue, PSI_mutex_key key_LOCK_log,
PSI_mutex_key key_LOCK_binlog_end_pos, PSI_mutex_key key_LOCK_sync,
PSI_mutex_key key_LOCK_sync_queue, PSI_mutex_key key_LOCK_xids,
PSI_cond_key key_COND_done, PSI_cond_key key_update_cond,
PSI_cond_key key_prep_xids_cond, PSI_file_key key_file_log,
PSI_file_key key_file_log_index, PSI_file_key key_file_log_cache,
PSI_file_key key_file_log_index_cache) {
m_key_COND_done = key_COND_done;
m_key_LOCK_commit_queue = key_LOCK_commit_queue;
m_key_LOCK_done = key_LOCK_done;
m_key_LOCK_flush_queue = key_LOCK_flush_queue;
m_key_LOCK_sync_queue = key_LOCK_sync_queue;
m_key_LOCK_index = key_LOCK_index;
m_key_LOCK_log = key_LOCK_log;
m_key_LOCK_binlog_end_pos = key_LOCK_binlog_end_pos;
m_key_LOCK_commit = key_LOCK_commit;
m_key_LOCK_sync = key_LOCK_sync;
m_key_LOCK_xids = key_LOCK_xids;
m_key_update_cond = key_update_cond;
m_key_prep_xids_cond = key_prep_xids_cond;
m_key_file_log = key_file_log;
m_key_file_log_index = key_file_log_index;
m_key_file_log_cache = key_file_log_cache;
m_key_file_log_index_cache = key_file_log_index_cache;
}
public:
/** Manage the MTS dependency tracking */
Transaction_dependency_tracker m_dependency_tracker;
/**
Find the oldest binary log that contains any GTID that
is not in the given gtid set.
@param[out] binlog_file_name the file name of oldest binary log found
@param[in] gtid_set the given gtid set
@param[out] first_gtid the first GTID information from the binary log
file returned at binlog_file_name
@param[out] errmsg the error message outputted, which is left untouched
if the function returns false
@return false on success, true on error.
*/
bool find_first_log_not_in_gtid_set(char *binlog_file_name,
const Gtid_set *gtid_set,
Gtid *first_gtid, const char **errmsg);
/**
Reads the set of all GTIDs in the binary/relay log, and the set
of all lost GTIDs in the binary log, and stores each set in
respective argument.
@param gtid_set Will be filled with all GTIDs in this binary/relay
log.
@param lost_groups Will be filled with all GTIDs in the
Previous_gtids_log_event of the first binary log that has a
Previous_gtids_log_event. This is requested to binary logs but not
to relay logs.
@param verify_checksum If true, checksums will be checked.
@param need_lock If true, LOCK_log, LOCK_index, and
global_sid_lock->wrlock are acquired; otherwise they are asserted
to be taken already.
@param [out] trx_parser This will be used to return the actual
relaylog transaction parser state because of the possibility
of partial transactions.
@param [out] partial_trx If a transaction was left incomplete
on the relaylog, its GTID information should be returned to be
used in the case of the rest of the transaction be added to the
relaylog.
@param is_server_starting True if the server is starting.
@return false on success, true on error.
*/
bool init_gtid_sets(Gtid_set *gtid_set, Gtid_set *lost_groups,
bool verify_checksum, bool need_lock,
Transaction_boundary_parser *trx_parser,
Gtid_monitoring_info *partial_trx,
bool is_server_starting = false);
void set_previous_gtid_set_relaylog(Gtid_set *previous_gtid_set_param) {
DBUG_ASSERT(is_relay_log);
previous_gtid_set_relaylog = previous_gtid_set_param;
}
/**
If the thread owns a GTID, this function generates an empty
transaction and releases ownership of the GTID.
- If the binary log is disabled for this thread, the GTID is
inserted directly into the mysql.gtid_executed table and the
GTID is included in @@global.gtid_executed. (This only happens
for DDL, since DML will save the GTID into table and release
ownership inside ha_commit_trans.)
- If the binary log is enabled for this thread, an empty
transaction consisting of GTID, BEGIN, COMMIT is written to the
binary log, the GTID is included in @@global.gtid_executed, and
the GTID is added to the mysql.gtid_executed table on the next
binlog rotation.
This function must be called by any committing statement (COMMIT,
implicitly committing statements, or Xid_log_event), after the
statement has completed execution, regardless of whether the
statement updated the database.
This logic ensures that an empty transaction is generated for the
following cases:
- Explicit empty transaction:
SET GTID_NEXT = 'UUID:NUMBER'; BEGIN; COMMIT;
- Transaction or DDL that gets completely filtered out in the
slave thread.
@param thd The committing thread
@retval 0 Success
@retval nonzero Error
*/
int gtid_end_transaction(THD *thd);
private:
std::atomic<enum_log_state> atomic_log_state{LOG_CLOSED};
/* The previous gtid set in relay log. */
Gtid_set *previous_gtid_set_relaylog;
int open(const char *opt_name) { return open_binlog(opt_name); }
bool change_stage(THD *thd, Stage_manager::StageID stage, THD *queue,
mysql_mutex_t *leave, mysql_mutex_t *enter);
std::pair<int, my_off_t> flush_thread_caches(THD *thd);
int flush_cache_to_file(my_off_t *flush_end_pos);
int finish_commit(THD *thd);
std::pair<bool, bool> sync_binlog_file(bool force);
void process_commit_stage_queue(THD *thd, THD *queue);
void process_after_commit_stage_queue(THD *thd, THD *first);
int process_flush_stage_queue(my_off_t *total_bytes_var, bool *rotate_var,
THD **out_queue_var);
int ordered_commit(THD *thd, bool all, bool skip_commit = false);
void handle_binlog_flush_or_sync_error(THD *thd, bool need_lock_log);
bool do_write_cache(Binlog_cache_storage *cache,
class Binlog_event_writer *writer);
void report_binlog_write_error();
public:
int open_binlog(const char *opt_name);
void close();
enum_result commit(THD *thd, bool all);
int rollback(THD *thd, bool all);
bool truncate_relaylog_file(Master_info *mi, my_off_t valid_pos);
int prepare(THD *thd, bool all);
#if defined(MYSQL_SERVER)
void update_thd_next_event_pos(THD *thd);
int flush_and_set_pending_rows_event(THD *thd, Rows_log_event *event,
bool is_transactional);
#endif /* defined(MYSQL_SERVER) */
void add_bytes_written(ulonglong inc) { bytes_written += inc; }
void reset_bytes_written() { bytes_written = 0; }
void harvest_bytes_written(ulonglong *counter) {
#ifndef DBUG_OFF
char buf1[22], buf2[22];
#endif
DBUG_ENTER("harvest_bytes_written");
(*counter) += bytes_written;
DBUG_PRINT("info", ("counter: %s bytes_written: %s", llstr(*counter, buf1),
llstr(bytes_written, buf2)));
bytes_written = 0;
DBUG_VOID_RETURN;
}
void set_max_size(ulong max_size_arg);
void signal_update() {
DBUG_ENTER("MYSQL_BIN_LOG::signal_update");
mysql_cond_broadcast(&update_cond);
DBUG_VOID_RETURN;
}
void update_binlog_end_pos(bool need_lock = true);
void update_binlog_end_pos(my_off_t pos);
int wait_for_update(const struct timespec *timeout);
public:
void init_pthread_objects();
void cleanup();
/**
Create a new binary log.
@param log_name Name of binlog
@param new_name Name of binlog, too. todo: what's the difference
between new_name and log_name?
@param max_size_arg The size at which this binlog will be rotated.
@param null_created_arg If false, and a Format_description_log_event
is written, then the Format_description_log_event will have the
timestamp 0. Otherwise, it the timestamp will be the time when the
event was written to the log.
@param need_lock_index If true, LOCK_index is acquired; otherwise
LOCK_index must be taken by the caller.
@param need_sid_lock If true, the read lock on global_sid_lock
will be acquired. Otherwise, the caller must hold the read lock
on global_sid_lock.
@param extra_description_event The master's FDE to be written by the I/O
thread while creating a new relay log file. This should be NULL for
binary log files.
@param new_index_number The binary log file index number to start from
after the RESET MASTER TO command is called.
*/
bool open_binlog(const char *log_name, const char *new_name,
ulong max_size_arg, bool null_created_arg,
bool need_lock_index, bool need_sid_lock,
Format_description_log_event *extra_description_event,
uint32 new_index_number = 0);
bool open_index_file(const char *index_file_name_arg, const char *log_name,
bool need_lock_index);
/* Use this to start writing a new log file */
int new_file(Format_description_log_event *extra_description_event);
bool write_event(Log_event *event_info);
bool write_cache(THD *thd, class binlog_cache_data *cache_data,
class Binlog_event_writer *writer);
/**
Assign automatic generated GTIDs for all commit group threads in the flush
stage having gtid_next.type == AUTOMATIC_GTID.
@param first_seen The first thread seen entering the flush stage.
@return Returns false if succeeds, otherwise true is returned.
*/
bool assign_automatic_gtids_to_flush_group(THD *first_seen);
bool write_gtid(THD *thd, binlog_cache_data *cache_data,
class Binlog_event_writer *writer);
/**
Write a dml into statement cache and then flush it into binlog. It writes
Gtid_log_event and BEGIN, COMMIT automatically.
It is aimed to handle cases of "background" logging where a statement is
logged indirectly, like "DELETE FROM a_memory_table". So don't use it on
any normal statement.
@param[in] thd the THD object of current thread.
@param[in] stmt the DELETE statement.
@param[in] stmt_len the length of DELETE statement.
@return Returns false if succeeds, otherwise true is returned.
*/
bool write_dml_directly(THD *thd, const char *stmt, size_t stmt_len);
void report_cache_write_error(THD *thd, bool is_transactional);
bool check_write_error(THD *thd);
bool write_incident(THD *thd, bool need_lock_log, const char *err_msg,
bool do_flush_and_sync = true);
bool write_incident(Incident_log_event *ev, THD *thd, bool need_lock_log,
const char *err_msg, bool do_flush_and_sync = true);
bool write_event_to_binlog(Log_event *ev);
bool write_event_to_binlog_and_flush(Log_event *ev);
bool write_event_to_binlog_and_sync(Log_event *ev);
void start_union_events(THD *thd, query_id_t query_id_param);
void stop_union_events(THD *thd);
bool is_query_in_union(THD *thd, query_id_t query_id_param);
bool write_buffer(const char *buf, uint len, Master_info *mi);
bool write_event(Log_event *ev, Master_info *mi);
private:
bool after_write_to_relay_log(Master_info *mi);
public:
void make_log_name(char *buf, const char *log_ident);
bool is_active(const char *log_file_name);
int remove_logs_from_index(LOG_INFO *linfo, bool need_update_threads);
int rotate(bool force_rotate, bool *check_purge);
void purge();
int rotate_and_purge(THD *thd, bool force_rotate);
bool flush();
/**
Flush binlog cache and synchronize to disk.
This function flushes events in binlog cache to binary log file,
it will do synchronizing according to the setting of system
variable 'sync_binlog'. If file is synchronized, @c synced will
be set to 1, otherwise 0.
@param[in] force if true, ignores the 'sync_binlog' and synchronizes the
file.
@retval 0 Success
@retval other Failure
*/
bool flush_and_sync(const bool force = false);
int purge_logs(const char *to_log, bool included, bool need_lock_index,
bool need_update_threads, ulonglong *decrease_log_space,
bool auto_purge);
int purge_logs_before_date(time_t purge_time, bool auto_purge);
int set_crash_safe_index_file_name(const char *base_file_name);
int open_crash_safe_index_file();
int close_crash_safe_index_file();
int add_log_to_index(uchar *log_file_name, size_t name_len,
bool need_lock_index);
int move_crash_safe_index_file_to_index_file(bool need_lock_index);
int set_purge_index_file_name(const char *base_file_name);
int open_purge_index_file(bool destroy);
bool is_inited_purge_index_file();
int close_purge_index_file();
int sync_purge_index_file();
int register_purge_index_entry(const char *entry);
int register_create_index_entry(const char *entry);
int purge_index_entry(THD *thd, ulonglong *decrease_log_space,
bool need_lock_index);
bool reset_logs(THD *thd, bool delete_only = false);
void close(uint exiting, bool need_lock_log, bool need_lock_index);
// iterating through the log index file
int find_log_pos(LOG_INFO *linfo, const char *log_name, bool need_lock_index);
int find_next_log(LOG_INFO *linfo, bool need_lock_index);
int find_next_relay_log(char log_name[FN_REFLEN + 1]);
int get_current_log(LOG_INFO *linfo, bool need_lock_log = true);
int raw_get_current_log(LOG_INFO *linfo);
uint next_file_id();
inline char *get_index_fname() { return index_file_name; }
inline char *get_log_fname() { return log_file_name; }
inline char *get_name() { return name; }
inline mysql_mutex_t *get_log_lock() { return &LOCK_log; }
inline mysql_cond_t *get_log_cond() { return &update_cond; }
inline Binlog_ofile *get_binlog_file() { return m_binlog_file; }
inline void lock_index() { mysql_mutex_lock(&LOCK_index); }
inline void unlock_index() { mysql_mutex_unlock(&LOCK_index); }
inline IO_CACHE *get_index_file() { return &index_file; }
inline uint32 get_open_count() { return open_count; }
/*
It is called by the threads (e.g. dump thread, applier thread) which want
to read hot log without LOCK_log protection.
*/
my_off_t get_binlog_end_pos() const {
mysql_mutex_assert_not_owner(&LOCK_log);
return atomic_binlog_end_pos;
}
mysql_mutex_t *get_binlog_end_pos_lock() { return &LOCK_binlog_end_pos; }
void lock_binlog_end_pos() { mysql_mutex_lock(&LOCK_binlog_end_pos); }
void unlock_binlog_end_pos() { mysql_mutex_unlock(&LOCK_binlog_end_pos); }
/**
Deep copy global_sid_map and gtid_executed.
Both operations are done under LOCK_commit and global_sid_lock
protection.
@param[out] sid_map The Sid_map to which global_sid_map will
be copied.
@param[out] gtid_set The Gtid_set to which gtid_executed will
be copied.
@return the operation status
@retval 0 OK
@retval !=0 Error
*/
int get_gtid_executed(Sid_map *sid_map, Gtid_set *gtid_set);
/*
True while rotating binlog, which is caused by logging Incident_log_event.
*/
bool is_rotating_caused_by_incident;
};
struct LOAD_FILE_INFO {
THD *thd;
my_off_t last_pos_in_file;
bool logged_data_file, log_delayed;
};
extern MYSQL_PLUGIN_IMPORT MYSQL_BIN_LOG mysql_bin_log;
/**
Check if at least one of transacaction and statement binlog caches contains
an empty transaction, other one is empty or contains an empty transaction,
which has two binlog events "BEGIN" and "COMMIT".
@param thd The client thread that executed the current statement.
@retval true At least one of transacaction and statement binlog caches
contains an empty transaction, other one is empty or
contains an empty transaction.
@retval false Otherwise.
*/
bool is_empty_transaction_in_binlog_cache(const THD *thd);
bool trans_has_updated_trans_table(const THD *thd);
bool stmt_has_updated_trans_table(Ha_trx_info *ha_list);
bool ending_trans(THD *thd, const bool all);
bool ending_single_stmt_trans(THD *thd, const bool all);
bool trans_cannot_safely_rollback(const THD *thd);
bool stmt_cannot_safely_rollback(const THD *thd);
int log_loaded_block(IO_CACHE *file);
bool purge_master_logs(THD *thd, const char *to_log);
bool purge_master_logs_before_date(THD *thd, time_t purge_time);
bool show_binlog_events(THD *thd, MYSQL_BIN_LOG *binary_log);
bool mysql_show_binlog_events(THD *thd);
void check_binlog_cache_size(THD *thd);
void check_binlog_stmt_cache_size(THD *thd);
bool binlog_enabled();
void register_binlog_handler(THD *thd, bool trx);
int query_error_code(THD *thd, bool not_killed);
extern const char *log_bin_index;
extern const char *log_bin_basename;
extern bool opt_binlog_order_commits;
extern ulong rpl_read_size;
/**
Turns a relative log binary log path into a full path, based on the
opt_bin_logname or opt_relay_logname. Also trims the cr-lf at the
end of the full_path before return to avoid any server startup
problem on windows.
@param from The log name we want to make into an absolute path.
@param to The buffer where to put the results of the
normalization.
@param is_relay_log Switch that makes is used inside to choose which
option (opt_bin_logname or opt_relay_logname) to
use when calculating the base path.
@returns true if a problem occurs, false otherwise.
*/
bool normalize_binlog_name(char *to, const char *from, bool is_relay_log);
#endif /* BINLOG_H_INCLUDED */