Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
M
MariaDB
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
nexedi
MariaDB
Commits
ff3e4bd9
Commit
ff3e4bd9
authored
Jun 29, 2007
by
unknown
Browse files
Options
Browse Files
Download
Plain Diff
Merge bk-internal.mysql.com:/home/bk/mysql-maria
into janus.mylan:/usr/home/serg/Abk/mysql-maria
parents
79d36c8e
34d15a59
Changes
31
Hide whitespace changes
Inline
Side-by-side
Showing
31 changed files
with
1366 additions
and
377 deletions
+1366
-377
mysys/Makefile.am
mysys/Makefile.am
+1
-1
storage/maria/Makefile.am
storage/maria/Makefile.am
+7
-1
storage/maria/ha_maria.cc
storage/maria/ha_maria.cc
+1
-1
storage/maria/ma_blockrec.c
storage/maria/ma_blockrec.c
+21
-9
storage/maria/ma_check.c
storage/maria/ma_check.c
+21
-7
storage/maria/ma_checkpoint.h
storage/maria/ma_checkpoint.h
+57
-10
storage/maria/ma_close.c
storage/maria/ma_close.c
+1
-0
storage/maria/ma_control_file.c
storage/maria/ma_control_file.c
+18
-22
storage/maria/ma_control_file.h
storage/maria/ma_control_file.h
+7
-16
storage/maria/ma_create.c
storage/maria/ma_create.c
+112
-74
storage/maria/ma_delete_all.c
storage/maria/ma_delete_all.c
+31
-36
storage/maria/ma_delete_table.c
storage/maria/ma_delete_table.c
+5
-4
storage/maria/ma_loghandler.c
storage/maria/ma_loghandler.c
+127
-139
storage/maria/ma_loghandler.h
storage/maria/ma_loghandler.h
+115
-0
storage/maria/ma_loghandler_lsn.h
storage/maria/ma_loghandler_lsn.h
+23
-3
storage/maria/ma_open.c
storage/maria/ma_open.c
+12
-0
storage/maria/ma_pagecache.c
storage/maria/ma_pagecache.c
+9
-16
storage/maria/ma_recovery.h
storage/maria/ma_recovery.h
+1
-1
storage/maria/ma_rename.c
storage/maria/ma_rename.c
+7
-9
storage/maria/ma_test1.c
storage/maria/ma_test1.c
+1
-1
storage/maria/ma_test2.c
storage/maria/ma_test2.c
+1
-1
storage/maria/maria_chk.c
storage/maria/maria_chk.c
+7
-0
storage/maria/maria_def.h
storage/maria/maria_def.h
+3
-2
storage/maria/maria_read_log.c
storage/maria/maria_read_log.c
+748
-0
storage/maria/trnman_public.h
storage/maria/trnman_public.h
+4
-0
storage/maria/unittest/ma_control_file-t.c
storage/maria/unittest/ma_control_file-t.c
+12
-11
storage/maria/unittest/ma_test_loghandler-t.c
storage/maria/unittest/ma_test_loghandler-t.c
+5
-5
storage/maria/unittest/ma_test_loghandler_multigroup-t.c
storage/maria/unittest/ma_test_loghandler_multigroup-t.c
+5
-5
storage/maria/unittest/ma_test_loghandler_multithread-t.c
storage/maria/unittest/ma_test_loghandler_multithread-t.c
+2
-2
storage/maria/unittest/ma_test_loghandler_pagecache-t.c
storage/maria/unittest/ma_test_loghandler_pagecache-t.c
+1
-1
storage/myisam/mi_close.c
storage/myisam/mi_close.c
+1
-0
No files found.
mysys/Makefile.am
View file @
ff3e4bd9
...
...
@@ -20,7 +20,7 @@ INCLUDES = @ZLIB_INCLUDES@ -I$(top_builddir)/include \
-I
$(top_srcdir)
/include
-I
$(srcdir)
pkglib_LIBRARIES
=
libmysys.a
LDADD
=
libmysys.a
$(top_builddir)
/strings/libmystrings.a
$(top_builddir)
/dbug/libdbug.a
noinst_HEADERS
=
mysys_priv.h my_static.h
noinst_HEADERS
=
mysys_priv.h my_static.h
my_safehash.h
libmysys_a_SOURCES
=
my_init.c my_getwd.c mf_getdate.c my_mmap.c
\
mf_path.c mf_loadpath.c my_file.c
\
my_open.c my_create.c my_dup.c my_seek.c my_read.c
\
...
...
storage/maria/Makefile.am
View file @
ff3e4bd9
...
...
@@ -33,7 +33,7 @@ SUBDIRS = . unittest
EXTRA_DIST
=
ma_test_all.sh ma_test_all.res ma_ft_stem.c CMakeLists.txt plug.in
pkgdata_DATA
=
ma_test_all ma_test_all.res
pkglib_LIBRARIES
=
libmaria.a
bin_PROGRAMS
=
maria_chk maria_pack maria_ftdump
bin_PROGRAMS
=
maria_chk maria_pack maria_ftdump
maria_read_log
maria_chk_DEPENDENCIES
=
$(LIBRARIES)
# Only reason to link with libmyisam.a here is that it's where some fulltext
# pieces are (but soon we'll remove fulltext dependencies from Maria).
...
...
@@ -49,6 +49,12 @@ maria_pack_LDADD= @CLIENT_EXTRA_LDFLAGS@ libmaria.a \
$(top_builddir)
/mysys/libmysys.a
\
$(top_builddir)
/dbug/libdbug.a
\
$(top_builddir)
/strings/libmystrings.a @ZLIB_LIBS@
maria_read_log_DEPENDENCIES
=
$(LIBRARIES)
maria_read_log_LDADD
=
@CLIENT_EXTRA_LDFLAGS@ libmaria.a
\
$(top_builddir)
/storage/myisam/libmyisam.a
\
$(top_builddir)
/mysys/libmysys.a
\
$(top_builddir)
/dbug/libdbug.a
\
$(top_builddir)
/strings/libmystrings.a @ZLIB_LIBS@
noinst_PROGRAMS
=
ma_test1 ma_test2 ma_test3 ma_rt_test ma_sp_test
noinst_HEADERS
=
maria_def.h ma_rt_index.h ma_rt_key.h ma_rt_mbr.h
\
ma_sp_defs.h ma_fulltext.h ma_ftdefs.h ma_ft_test1.h
\
...
...
storage/maria/ha_maria.cc
View file @
ff3e4bd9
...
...
@@ -2241,7 +2241,7 @@ static int ha_maria_init(void *p)
maria_hton
->
flags
=
HTON_CAN_RECREATE
|
HTON_SUPPORT_LOG_TABLES
;
bzero
(
maria_log_pagecache
,
sizeof
(
*
maria_log_pagecache
));
maria_data_root
=
mysql_real_data_home
;
res
=
maria_init
()
||
ma_control_file_create_or_open
()
||
res
=
maria_init
()
||
ma_control_file_create_or_open
(
TRUE
)
||
(
init_pagecache
(
maria_log_pagecache
,
TRANSLOG_PAGECACHE_SIZE
,
0
,
0
,
TRANSLOG_PAGE_SIZE
)
==
0
)
||
...
...
storage/maria/ma_blockrec.c
View file @
ff3e4bd9
...
...
@@ -557,7 +557,8 @@ static my_bool check_if_zero(byte *pos, uint length)
SYNOPSIS
_ma_unpin_all_pages()
info Maria handler
undo_lsn LSN for undo pages. 0 if we shouldn't write undo (error)
undo_lsn LSN for undo pages. LSN_IMPOSSIBLE if we shouldn't write undo
(error)
NOTE
We unpin pages in the reverse order as they where pinned; This may not
...
...
@@ -580,14 +581,15 @@ void _ma_unpin_all_pages(MARIA_HA *info, LSN undo_lsn)
DBUG_PRINT
(
"info"
,
(
"undo_lsn: %lu"
,
(
ulong
)
undo_lsn
));
/* True if not disk error */
DBUG_ASSERT
(
undo_lsn
!=
0
||
!
info
->
s
->
base
.
transactional
);
DBUG_ASSERT
(
(
undo_lsn
!=
LSN_IMPOSSIBLE
)
||
!
info
->
s
->
base
.
transactional
);
if
(
!
info
->
s
->
base
.
transactional
)
{
/*
If this is a transactional table but with transactionality temporarily
disabled (like in ALTER TABLE) we need to give a sensible LSN to pages
and not 0. If this is not a transactional table it will reduce to 0.
and not LSN_IMPOSSIBLE. If this is not a transactional table it will
reduce to LSN_IMPOSSIBLE.
*/
undo_lsn
=
info
->
s
->
state
.
create_rename_lsn
;
}
...
...
@@ -1958,8 +1960,8 @@ static my_bool write_block_record(MARIA_HA *info,
size_t
data_length
=
(
size_t
)
(
data
-
row_pos
->
data
);
/* Log REDO changes of head page */
page_store
(
log_data
+
FILEID_STORE_SIZE
,
head_block
->
page
);
dirpos_store
(
log_data
+
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
,
page_store
(
log_data
+
FILEID_STORE_SIZE
,
head_block
->
page
);
dirpos_store
(
log_data
+
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
,
row_pos
->
rownr
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
=
(
char
*
)
log_data
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
sizeof
(
log_data
);
...
...
@@ -2183,12 +2185,22 @@ static my_bool write_block_record(MARIA_HA *info,
disk_err:
/**
@todo RECOVERY we are going to let dirty pages go to disk while we have
logged UNDO, this violates WAL.
If we have not written any full pages,
all dirty pages are pinned so we could just delete them from the
pagecache. Moreover,
we have written some REDOs without a closing UNDO,
logged UNDO, this violates WAL.
We must mark the table corrupted!
@todo RECOVERY
we have written some REDOs without a closing UNDO,
it's possible that a next operation by this transaction succeeds and then
Recovery would glue the "orphan REDOs" to the succeeded operation and
execute the failed REDOs.
execute the failed REDOs. We need some mark "abort this group" in the
log, or mark the table corrupted (then user will repair it and thus REDOs
will be skipped).
@todo RECOVERY to not let write errors go unnoticed, pagecache_write()
should take a MARIA_HA* in argument, and it it
fails when flushing a page to disk it should call
(*the_maria_ha->write_error_func)(the_maria_ha)
and this hook will mark the table corrupted.
Maybe hook should be stored in the pagecache's block structure, or in a
hash "file->maria_ha*".
*/
/* Unpin all pinned pages to not cause problems for disk cache */
_ma_unpin_all_pages
(
info
,
0
);
...
...
storage/maria/ma_check.c
View file @
ff3e4bd9
...
...
@@ -5176,7 +5176,23 @@ int _ma_repair_write_log_record(const HA_CHECK *param, MARIA_HA *info)
/* Only called from ha_maria.cc, not maria_check, so translog is inited */
if
(
share
->
base
.
transactional
&&
!
share
->
temporary
)
{
/* For now this record is only informative */
/*
For now this record is only informative. It could serve when applying
logs to a backup, but that needs more thought. Assume table became
corrupted. It is repaired, then some writes happen to it.
Later we restore an old backup, and want to apply this REDO_REPAIR_TABLE
record. For it to give the same result as originally, the table should
be corrupted the same way, so applying previous REDOs should produce the
same corruption; that's really not guaranteed (different execution paths
in execution of REDOs vs runtime code so not same bugs hit, temporary
hardware issues not repeatable etc). Corruption may not be repeatable.
A reasonable solution is to execute the REDO_REPAIR_TABLE record and
check if the checksum of the resulting table matches what it was at the
end of the original repair (should be stored in log record); or execute
the REDO_REPAIR_TABLE if the checksum of the table-before-repair matches
was it was at the start of the original repair (should be stored in log
record).
*/
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
];
uchar
log_data
[
LSN_STORE_SIZE
];
compile_time_assert
(
LSN_STORE_SIZE
>=
(
FILEID_STORE_SIZE
+
4
));
...
...
@@ -5193,19 +5209,17 @@ int _ma_repair_write_log_record(const HA_CHECK *param, MARIA_HA *info)
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
,
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]),
log_array
,
log_data
)))
log_array
,
log_data
)
||
translog_flush
(
share
->
state
.
create_rename_lsn
)))
return
1
;
/*
But this piece is really needed, to have the new table's content durable
and to not apply old REDOs to the new table. The table's existence was
made durable earlier (MY_SYNC_DIR passed to maria_change_to_newfile()).
*/
lsn_store
(
log_data
,
share
->
state
.
create_rename_lsn
);
DBUG_ASSERT
(
info
->
dfile
.
file
>=
0
);
DBUG_ASSERT
(
share
->
kfile
.
file
>=
0
);
return
(
my_pwrite
(
share
->
kfile
.
file
,
log_data
,
sizeof
(
log_data
),
sizeof
(
share
->
state
.
header
)
+
2
,
MYF
(
MY_NABP
))
||
_ma_sync_table_files
(
info
));
return
_ma_update_create_rename_lsn_on_disk
(
share
,
FALSE
)
||
_ma_sync_table_files
(
info
);
}
return
0
;
}
storage/maria/ma_checkpoint.h
View file @
ff3e4bd9
/* Copyright (C) 2006
MySQL AB & MySQL Finland AB & TCX DataKonsult
AB
/* Copyright (C) 2006
,2007 MySQL
AB
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
...
...
@@ -21,14 +21,61 @@
/* This is the interface of this module. */
typedef
enum
enum_checkpoint_level
{
NONE
=-
1
,
INDIRECT
,
/* just write dirty_pages, transactions table and sync files */
MEDIUM
,
/* also flush all dirty pages which were already dirty at prev checkpoint*/
FULL
/* also flush all dirty pages */
typedef
enum
enum_ma_checkpoint_level
{
CHECKPOINT_NONE
=
0
,
/* just write dirty_pages, transactions table and sync files */
CHECKPOINT_INDIRECT
,
/* also flush all dirty pages which were already dirty at prev checkpoint */
CHECKPOINT_MEDIUM
,
/* also flush all dirty pages */
CHECKPOINT_FULL
}
CHECKPOINT_LEVEL
;
void
request_asynchronous_checkpoint
(
CHECKPOINT_LEVEL
level
);
my_bool
execute_synchronous_checkpoint
(
CHECKPOINT_LEVEL
level
);
my_bool
execute_asynchronous_checkpoint_if_any
();
/* that's all that's needed in the interface */
C_MODE_START
int
ma_checkpoint_init
();
void
ma_checkpoint_end
();
int
ma_checkpoint_execute
(
CHECKPOINT_LEVEL
level
,
my_bool
no_wait
);
C_MODE_END
/**
@brief reads some LSNs with special trickery
If a 64-bit variable transitions between both halves being zero to both
halves being non-zero, and back, this function can be used to do a read of
it (without mutex, without atomic load) which always produces a correct
(though maybe slightly old) value (even on 32-bit CPUs). The value is at
least as new as the latest mutex unlock done by the calling thread.
The assumption is that the system sets both 4-byte halves either at the
same time, or one after the other (in any order), but NOT some bytes of the
first half then some bytes of the second half then the rest of bytes of the
first half. With this assumption, the function can detect when it is
seeing an inconsistent value.
@param LSN pointer to the LSN variable to read
@return LSN part (most significant byte always 0)
*/
#if ( SIZEOF_CHARP >= 8 )
/* 64-bit CPU, 64-bit reads are atomic */
#define lsn_read_non_atomic LSN_WITH_FLAGS_TO_LSN
#else
static
inline
LSN
lsn_read_non_atomic_32
(
const
volatile
LSN
*
x
)
{
/*
32-bit CPU, 64-bit reads may give a mixed of old half and new half (old
low bits and new high bits, or the contrary).
*/
for
(;;)
/* loop until no atomicity problems */
{
/*
Remove most significant byte in case this is a LSN_WITH_FLAGS object.
Those flags in TRN::first_undo_lsn break the condition on transitions so
they must be removed below.
*/
LSN
y
=
LSN_WITH_FLAGS_TO_LSN
(
*
x
);
if
(
likely
((
y
==
LSN_IMPOSSIBLE
)
||
LSN_VALID
(
y
)))
return
y
;
}
}
#define lsn_read_non_atomic(x) lsn_read_non_atomic_32(&x)
#endif
storage/maria/ma_close.c
View file @
ff3e4bd9
...
...
@@ -85,6 +85,7 @@ int maria_close(register MARIA_HA *info)
not change the crashed state.
We can NOT write the state in other cases as other threads
may be using the file at this point
IF using --external-locking, which does not apply to Maria.
*/
if
(
share
->
mode
!=
O_RDONLY
&&
maria_is_crashed
(
info
))
_ma_state_info_write
(
share
->
kfile
.
file
,
&
share
->
state
,
1
);
...
...
storage/maria/ma_control_file.c
View file @
ff3e4bd9
...
...
@@ -40,15 +40,9 @@
#define CONTROL_FILE_FILENO_SIZE 4
#define CONTROL_FILE_SIZE (CONTROL_FILE_FILENO_OFFSET + CONTROL_FILE_FILENO_SIZE)
/*
This module owns these two vars.
uint32 is always atomically updated, but LSN is 8 bytes, we will need
provisions to ensure that it's updated atomically in
ma_control_file_write_and_force(). Probably the log mutex could be
used. TODO.
*/
LSN
last_checkpoint_lsn
;
uint32
last_logno
;
/* This module owns these two vars. */
LSN
last_checkpoint_lsn
=
LSN_IMPOSSIBLE
;
uint32
last_logno
=
FILENO_IMPOSSIBLE
;
/**
@brief If log's lock should be asserted when writing to control file.
...
...
@@ -65,16 +59,16 @@ my_bool maria_multi_threaded= FALSE;
static
int
control_file_fd
=
-
1
;
/*
Initialize control file subsystem
SYNOPSIS
ma_control_file_create_or_open()
@brief Initialize control file subsystem
Looks for the control file. If
absent, it's a fresh start
, creates file.
Looks for the control file. If
none and creation is requested
, creates file.
If present, reads it to find out last checkpoint's LSN and last log, updates
the last_checkpoint_lsn and last_logno global variables.
Called at engine's start.
@param create_if_missing
@note
The format of the control file is:
4 bytes: magic string
4 bytes: checksum of the following bytes
...
...
@@ -82,11 +76,11 @@ static int control_file_fd= -1;
4 bytes: offset in log where last checkpoint is
4 bytes: number of last log
RETURN
0 -
OK
1 -
Error (in which case the file is left closed)
@return Operation status
@retval 0
OK
@retval 1
Error (in which case the file is left closed)
*/
CONTROL_FILE_ERROR
ma_control_file_create_or_open
()
CONTROL_FILE_ERROR
ma_control_file_create_or_open
(
my_bool
create_if_missing
)
{
char
buffer
[
CONTROL_FILE_SIZE
];
char
name
[
FN_REFLEN
];
...
...
@@ -115,6 +109,8 @@ CONTROL_FILE_ERROR ma_control_file_create_or_open()
if
(
create_file
)
{
if
(
!
create_if_missing
)
DBUG_RETURN
(
CONTROL_FILE_MISSING
);
if
((
control_file_fd
=
my_create
(
name
,
0
,
open_flags
,
MYF
(
MY_SYNC_DIR
)))
<
0
)
DBUG_RETURN
(
CONTROL_FILE_UNKNOWN_ERROR
);
...
...
@@ -136,8 +132,8 @@ CONTROL_FILE_ERROR ma_control_file_create_or_open()
*/
/* init the file with these "undefined" values */
DBUG_RETURN
(
ma_control_file_write_and_force
(
CONTROL_FILE_IMPOSSIBLE_LSN
,
CONTROL_FILE_IMPOSSIBLE_FILENO
,
DBUG_RETURN
(
ma_control_file_write_and_force
(
LSN_IMPOSSIBLE
,
FILENO_IMPOSSIBLE
,
CONTROL_FILE_UPDATE_ALL
));
}
...
...
@@ -315,8 +311,8 @@ int ma_control_file_end()
As this module owns these variables, closing the module forbids access to
them (just a safety):
*/
last_checkpoint_lsn
=
CONTROL_FILE_IMPOSSIBLE_LSN
;
last_logno
=
CONTROL_FILE_IMPOSSIBLE_FILENO
;
last_checkpoint_lsn
=
LSN_IMPOSSIBLE
;
last_logno
=
FILENO_IMPOSSIBLE
;
DBUG_RETURN
(
close_error
);
}
storage/maria/ma_control_file.h
View file @
ff3e4bd9
...
...
@@ -19,27 +19,17 @@
*/
#define CONTROL_FILE_BASE_NAME "maria_control"
/*
indicate absence of the log file number; first log is always number 1, 0 is
impossible.
*/
#define CONTROL_FILE_IMPOSSIBLE_FILENO 0
/* logs always have a header */
#define CONTROL_FILE_IMPOSSIBLE_LOG_OFFSET 0
/* indicate absence of LSN. */
#define CONTROL_FILE_IMPOSSIBLE_LSN ((LSN)0)
/* Here is the interface of this module */
/*
LSN of the last checkoint
(if last_checkpoint_lsn == CONTROL_FILE_IMPOSSIBLE_LSN
then there was never a checkpoint)
(if last_checkpoint_lsn == LSN_IMPOSSIBLE then there was never a checkpoint)
*/
extern
LSN
last_checkpoint_lsn
;
/*
Last log number (if last_logno ==
CONTROL_FILE_IMPOSSIBLE_FILENO then there is no log
file yet)
Last log number (if last_logno ==
FILENO_IMPOSSIBLE then there is no log
file yet)
*/
extern
uint32
last_logno
;
...
...
@@ -51,6 +41,7 @@ typedef enum enum_control_file_error {
CONTROL_FILE_TOO_BIG
,
CONTROL_FILE_BAD_MAGIC_STRING
,
CONTROL_FILE_BAD_CHECKSUM
,
CONTROL_FILE_MISSING
,
CONTROL_FILE_UNKNOWN_ERROR
/* any other error */
}
CONTROL_FILE_ERROR
;
...
...
@@ -63,11 +54,11 @@ extern "C" {
#endif
/*
Looks for the control file. If
absent, it's a fresh start, create
file.
If present, read it to find out last checkpoint's LSN and last log.
Looks for the control file. If
none and creation was requested, creates
file.
If present, read
s
it to find out last checkpoint's LSN and last log.
Called at engine's start.
*/
CONTROL_FILE_ERROR
ma_control_file_create_or_open
();
CONTROL_FILE_ERROR
ma_control_file_create_or_open
(
my_bool
);
/*
Write information durably to the control file.
Called when we have created a new log (after syncing this log's creation)
...
...
storage/maria/ma_create.c
View file @
ff3e4bd9
...
...
@@ -52,8 +52,7 @@ int maria_create(const char *name, enum data_file_type datafile_type,
unique_key_parts
,
fulltext_keys
,
offset
,
not_block_record_extra_length
;
uint
max_field_lengths
,
extra_header_size
;
ulong
reclength
,
real_reclength
,
min_pack_length
;
char
filename
[
FN_REFLEN
],
dlinkname
[
FN_REFLEN
],
*
dlinkname_ptr
=
NULL
,
klinkname
[
FN_REFLEN
],
*
klinkname_ptr
=
NULL
;
char
filename
[
FN_REFLEN
],
linkname
[
FN_REFLEN
],
*
linkname_ptr
;
ulong
pack_reclength
;
ulonglong
tot_length
,
max_rows
,
tmp
;
enum
en_fieldtype
type
;
...
...
@@ -621,14 +620,14 @@ int maria_create(const char *name, enum data_file_type datafile_type,
mi_int2store
(
share
.
state
.
header
.
state_info_length
,
MARIA_STATE_INFO_SIZE
);
mi_int2store
(
share
.
state
.
header
.
base_info_length
,
MARIA_BASE_INFO_SIZE
);
mi_int2store
(
share
.
state
.
header
.
base_pos
,
base_pos
);
share
.
state
.
header
.
data_file_type
=
datafile_type
;
share
.
state
.
header
.
data_file_type
=
share
.
data_file_type
=
datafile_type
;
share
.
state
.
header
.
org_data_file_type
=
org_datafile_type
;
share
.
state
.
header
.
language
=
(
ci
->
language
?
ci
->
language
:
default_charset_info
->
number
);
share
.
state
.
dellink
=
HA_OFFSET_ERROR
;
share
.
state
.
first_bitmap_with_space
=
0
;
share
.
state
.
create_rename_lsn
=
0
;
share
.
state
.
create_rename_lsn
=
LSN_IMPOSSIBLE
;
share
.
state
.
process
=
(
ulong
)
getpid
();
share
.
state
.
unique
=
(
ulong
)
0
;
share
.
state
.
update_count
=
(
ulong
)
0
;
...
...
@@ -721,9 +720,9 @@ int maria_create(const char *name, enum data_file_type datafile_type,
MY_UNPACK_FILENAME
|
(
have_iext
?
MY_REPLACE_EXT
:
MY_APPEND_EXT
));
}
fn_format
(
k
linkname
,
name
,
""
,
MARIA_NAME_IEXT
,
fn_format
(
linkname
,
name
,
""
,
MARIA_NAME_IEXT
,
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
klinkname_ptr
=
k
linkname
;
linkname_ptr
=
linkname
;
/*
Don't create the table if the link or file exists to ensure that one
doesn't accidently destroy another table.
...
...
@@ -739,6 +738,7 @@ int maria_create(const char *name, enum data_file_type datafile_type,
(
MY_UNPACK_FILENAME
|
(
flags
&
HA_DONT_TOUCH_DATA
)
?
MY_RETURN_REAL_PATH
:
0
)
|
MY_APPEND_EXT
);
linkname_ptr
=
NULL
;
/*
Replace the current file.
Don't sync dir now if the data file has the same path.
...
...
@@ -761,54 +761,11 @@ int maria_create(const char *name, enum data_file_type datafile_type,
goto
err
;
}
if
((
file
=
my_create_with_symlink
(
k
linkname_ptr
,
filename
,
0
,
create_mode
,
if
((
file
=
my_create_with_symlink
(
linkname_ptr
,
filename
,
0
,
create_mode
,
MYF
(
MY_WME
|
create_flag
)))
<
0
)
goto
err
;
errpos
=
1
;
if
(
!
(
flags
&
HA_DONT_TOUCH_DATA
))
{
if
(
ci
->
data_file_name
)
{
char
*
dext
=
strrchr
(
ci
->
data_file_name
,
'.'
);
int
have_dext
=
dext
&&
!
strcmp
(
dext
,
MARIA_NAME_DEXT
);
if
(
tmp_table
)
{
char
*
path
;
/* chop off the table name, tempory tables use generated name */
if
((
path
=
strrchr
(
ci
->
data_file_name
,
FN_LIBCHAR
)))
*
path
=
'\0'
;
fn_format
(
filename
,
name
,
ci
->
data_file_name
,
MARIA_NAME_DEXT
,
MY_REPLACE_DIR
|
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
}
else
{
fn_format
(
filename
,
ci
->
data_file_name
,
""
,
MARIA_NAME_DEXT
,
MY_UNPACK_FILENAME
|
(
have_dext
?
MY_REPLACE_EXT
:
MY_APPEND_EXT
));
}
fn_format
(
dlinkname
,
name
,
""
,
MARIA_NAME_DEXT
,
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
dlinkname_ptr
=
dlinkname
;
create_flag
=
0
;
}
else
{
fn_format
(
filename
,
name
,
""
,
MARIA_NAME_DEXT
,
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
create_flag
=
MY_DELETE_OLD
;
}
if
((
dfile
=
my_create_with_symlink
(
dlinkname_ptr
,
filename
,
0
,
create_mode
,
MYF
(
MY_WME
|
create_flag
|
sync_dir
)))
<
0
)
goto
err
;
errpos
=
3
;
share
.
data_file_type
=
datafile_type
;
if
(
_ma_initialize_data_file
(
dfile
,
&
share
))
goto
err
;
}
DBUG_PRINT
(
"info"
,
(
"write state info and base info"
));
if
(
_ma_state_info_write
(
file
,
&
share
.
state
,
2
)
||
_ma_base_info_write
(
file
,
&
share
.
base
))
...
...
@@ -948,33 +905,38 @@ int maria_create(const char *name, enum data_file_type datafile_type,
not log 1 KB of mostly zeroes if this is a small table.
*/
char
empty_string
[]
=
""
;
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
3
];
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
4
];
uint
total_rec_length
=
0
;
uint
i
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
1
+
2
+
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
length
=
1
+
2
+
2
+
kfile_size_before_extension
;
/* we are needing maybe 64 kB, so don't use the stack */
log_data
=
my_malloc
(
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
,
MYF
(
0
));
log_data
=
my_malloc
(
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
length
,
MYF
(
0
));
if
((
log_data
==
NULL
)
||
my_pread
(
file
,
1
+
2
+
log_data
,
kfile_size_before_extension
,
my_pread
(
file
,
1
+
2
+
2
+
log_data
,
kfile_size_before_extension
,
0
,
MYF
(
MY_NABP
)))
goto
err
_no_lock
;
goto
err
;
/*
remember if the data file was created or not, to know if Recovery can
do it or not, in the future
*/
log_data
[
0
]
=
test
(
flags
&
HA_DONT_TOUCH_DATA
);
int2store
(
log_data
+
1
,
kfile_size_before_extension
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
=
log_data
;
int2store
(
log_data
+
1
+
2
,
share
.
base
.
keystart
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
=
(
char
*
)
name
;
/* we store the end-zero, for Recovery to just pass it to my_create() */
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
strlen
(
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
)
+
1
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
str
=
log_data
;
/* symlink description is also needed for re-creation by Recovery: */
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
str
=
dlinkname_ptr
?
dlinkname
:
empty_string
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
length
=
strlen
(
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
str
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
2
].
str
=
klinkname_ptr
?
klinkname
:
empty_string
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
2
].
str
=
(
char
*
)
(
ci
->
data_file_name
?
ci
->
data_file_name
:
empty_string
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
2
].
length
=
strlen
(
log_array
[
TRANSLOG_INTERNAL_PARTS
+
2
].
str
);
strlen
(
log_array
[
TRANSLOG_INTERNAL_PARTS
+
2
].
str
)
+
1
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
3
].
str
=
(
char
*
)
(
ci
->
index_file_name
?
ci
->
index_file_name
:
empty_string
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
3
].
length
=
strlen
(
log_array
[
TRANSLOG_INTERNAL_PARTS
+
3
].
str
)
+
1
;
for
(
i
=
TRANSLOG_INTERNAL_PARTS
;
i
<
(
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]));
i
++
)
total_rec_length
+=
log_array
[
i
].
length
;
...
...
@@ -983,8 +945,14 @@ int maria_create(const char *name, enum data_file_type datafile_type,
MySQL layer to be crash-safe, which it is not now (that would require
work using the ddl_log of sql/sql_table.cc); when it is, we should
reconsider the moment of writing this log record (before or after op,
under THR_LOCK_maria or not...), how to use it in Recovery, and force
the log. For now this record is just informative.
under THR_LOCK_maria or not...), how to use it in Recovery.
For now this record can serve when we apply logs to a backup,
so we sync it. This happens before the data file is created. If the data
file was created before, and we crashed before writing the log record,
at restart the table may be used, so we would not have a trustable
history in the log (impossible to apply this log to a backup). The way
we do it, if we crash before writing the log record then there is no
data file and the table cannot be used.
Note that in case of TRUNCATE TABLE we also come here.
When in CREATE/TRUNCATE (or DROP or RENAME or REPAIR) we have not called
external_lock(), so have no TRN. It does not matter, as all these
...
...
@@ -995,21 +963,63 @@ int maria_create(const char *name, enum data_file_type datafile_type,
&
dummy_transaction_object
,
NULL
,
total_rec_length
,
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]),
log_array
,
NULL
)))
goto
err_no_lock
;
log_array
,
NULL
)
||
translog_flush
(
share
.
state
.
create_rename_lsn
)))
goto
err
;
/*
store LSN into file, needed for Recovery to not be confused if a
DROP+CREATE happened (applying REDOs to the wrong table).
If such direct my_pwrite() to a fixed offset is too "hackish", I can
call ma_state_info_write() again but it will be less efficient.
*/
lsn_store
(
log_data
,
share
.
state
.
create_rename_lsn
);
if
(
my_pwrite
(
file
,
log_data
,
LSN_STORE_SIZE
,
sizeof
(
share
.
state
.
header
)
+
2
,
MYF
(
MY_NABP
)))
goto
err_no_lock
;
share
.
kfile
.
file
=
file
;
if
(
_ma_update_create_rename_lsn_on_disk
(
&
share
,
FALSE
))
goto
err
;
my_free
(
log_data
,
MYF
(
0
));
}
if
(
!
(
flags
&
HA_DONT_TOUCH_DATA
))
{
if
(
ci
->
data_file_name
)
{
char
*
dext
=
strrchr
(
ci
->
data_file_name
,
'.'
);
int
have_dext
=
dext
&&
!
strcmp
(
dext
,
MARIA_NAME_DEXT
);
if
(
tmp_table
)
{
char
*
path
;
/* chop off the table name, tempory tables use generated name */
if
((
path
=
strrchr
(
ci
->
data_file_name
,
FN_LIBCHAR
)))
*
path
=
'\0'
;
fn_format
(
filename
,
name
,
ci
->
data_file_name
,
MARIA_NAME_DEXT
,
MY_REPLACE_DIR
|
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
}
else
{
fn_format
(
filename
,
ci
->
data_file_name
,
""
,
MARIA_NAME_DEXT
,
MY_UNPACK_FILENAME
|
(
have_dext
?
MY_REPLACE_EXT
:
MY_APPEND_EXT
));
}
fn_format
(
linkname
,
name
,
""
,
MARIA_NAME_DEXT
,
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
linkname_ptr
=
linkname
;
create_flag
=
0
;
}
else
{
fn_format
(
filename
,
name
,
""
,
MARIA_NAME_DEXT
,
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
linkname_ptr
=
NULL
;
create_flag
=
MY_DELETE_OLD
;
}
if
((
dfile
=
my_create_with_symlink
(
linkname_ptr
,
filename
,
0
,
create_mode
,
MYF
(
MY_WME
|
create_flag
|
sync_dir
)))
<
0
)
goto
err
;
errpos
=
3
;
if
(
_ma_initialize_data_file
(
dfile
,
&
share
))
goto
err
;
}
/* Enlarge files */
DBUG_PRINT
(
"info"
,
(
"enlarge to keystart: %lu"
,
(
ulong
)
share
.
base
.
keystart
));
...
...
@@ -1025,7 +1035,6 @@ int maria_create(const char *name, enum data_file_type datafile_type,
if
(
my_chsize
(
dfile
,
share
.
base
.
min_pack_length
*
ci
->
reloc_rows
,
0
,
MYF
(
0
)))
goto
err
;
#endif
errpos
=
2
;
if
((
sync_dir
&&
my_sync
(
dfile
,
MYF
(
0
)))
||
my_close
(
dfile
,
MYF
(
0
)))
goto
err
;
}
...
...
@@ -1157,3 +1166,32 @@ int _ma_initialize_data_file(File dfile, MARIA_SHARE *share)
}
return
0
;
}
/**
@brief Writes create_rename_lsn to disk, optionally forces
This is for special cases where:
- we don't want to write the full state to disk (so, not call
_ma_state_info_write()) because some parts of the state may be
currently inconsistent, or because it would be overkill
- we must sync this LSN immediately for correctness.
@param share table's share
@param do_sync if the write should be forced to disk
@return Operation status
@retval 0 ok
@retval 1 error (disk problem)
*/
int
_ma_update_create_rename_lsn_on_disk
(
MARIA_SHARE
*
share
,
my_bool
do_sync
)
{
char
buf
[
LSN_STORE_SIZE
];
File
file
=
share
->
kfile
.
file
;
DBUG_ASSERT
(
file
>=
0
);
lsn_store
(
buf
,
share
->
state
.
create_rename_lsn
);
return
(
my_pwrite
(
file
,
buf
,
sizeof
(
buf
),
sizeof
(
share
->
state
.
header
)
+
2
,
MYF
(
MY_NABP
))
||
(
do_sync
&&
my_sync
(
file
,
MYF
(
0
))));
}
storage/maria/ma_delete_all.c
View file @
ff3e4bd9
...
...
@@ -17,7 +17,7 @@
/* This clears the status information and truncates files */
#include "maria_def.h"
#include "trnman
_public
.h"
#include "trnman.h"
/**
@brief deletes all rows from a table
...
...
@@ -52,6 +52,25 @@ int maria_delete_all_rows(MARIA_HA *info)
if
(
_ma_mark_file_changed
(
info
))
goto
err
;
if
(
log_record
)
{
/*
This record will be used by Recovery to finish the deletion if it
crashed. We force it because it's a non-undoable operation.
*/
LSN
lsn
;
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
];
uchar
log_data
[
FILEID_STORE_SIZE
];
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
=
(
char
*
)
log_data
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
sizeof
(
log_data
);
if
(
unlikely
(
translog_write_record
(
&
lsn
,
LOGREC_REDO_DELETE_ALL
,
info
->
trn
,
share
,
0
,
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]),
log_array
,
log_data
)
||
translog_flush
(
lsn
)))
goto
err
;
}
info
->
state
->
records
=
info
->
state
->
del
=
state
->
split
=
0
;
state
->
changed
=
0
;
/* File is optimized */
state
->
dellink
=
HA_OFFSET_ERROR
;
...
...
@@ -78,6 +97,12 @@ int maria_delete_all_rows(MARIA_HA *info)
if
(
_ma_initialize_data_file
(
info
->
dfile
.
file
,
share
))
goto
err
;
/*
The operations above on the index/data file will be forced to disk at
Checkpoint or maria_close() time. So we can reset:
*/
info
->
trn
->
rec_lsn
=
LSN_IMPOSSIBLE
;
VOID
(
_ma_writeinfo
(
info
,
WRITEINFO_UPDATE_KEYFILE
));
#ifdef HAVE_MMAP
/* Resize mmaped area */
...
...
@@ -85,38 +110,6 @@ int maria_delete_all_rows(MARIA_HA *info)
_ma_remap_file
(
info
,
(
my_off_t
)
0
);
rw_unlock
(
&
info
->
s
->
mmap_lock
);
#endif
if
(
log_record
)
{
/* For now this record is only informative */
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
];
uchar
log_data
[
LSN_STORE_SIZE
];
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
=
(
char
*
)
log_data
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
FILEID_STORE_SIZE
;
if
(
unlikely
(
translog_write_record
(
&
share
->
state
.
create_rename_lsn
,
LOGREC_REDO_DELETE_ALL
,
info
->
trn
,
share
,
0
,
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]),
log_array
,
log_data
)))
goto
err
;
/*
store LSN into file. It is an optimization so that all old REDOs for
this table are ignored (scenario: checkpoint, INSERT1s, DELETE ALL;
INSERT2s, crash: then Recovery can skip INSERT1s). It also allows us to
ignore the present record at Recovery.
Note that storing the LSN could not be done by _ma_writeinfo() above as
the table is locked at this moment. So we need to do it by ourselves.
*/
lsn_store
(
log_data
,
share
->
state
.
create_rename_lsn
);
if
(
my_pwrite
(
share
->
kfile
.
file
,
log_data
,
sizeof
(
log_data
),
sizeof
(
share
->
state
.
header
)
+
2
,
MYF
(
MY_NABP
))
||
_ma_sync_table_files
(
info
))
goto
err
;
/**
@todo RECOVERY Until we take into account the log record above
for log-low-water-mark calculation and use it in Recovery, we need
to sync above.
*/
}
allow_break
();
/* Allow SIGHUP & SIGINT */
DBUG_RETURN
(
0
);
...
...
@@ -125,9 +118,11 @@ int maria_delete_all_rows(MARIA_HA *info)
int
save_errno
=
my_errno
;
VOID
(
_ma_writeinfo
(
info
,
WRITEINFO_UPDATE_KEYFILE
));
info
->
update
|=
HA_STATE_WRITTEN
;
/* Buffer changed */
/** @todo RECOVERY until we use the log record above we have to sync */
if
(
log_record
&&
_ma_sync_table_files
(
info
)
&&
!
save_errno
)
save_errno
=
my_errno
;
/**
@todo RECOVERY if we come here, Recovery may later apply the REDO above,
which may be wrong. Not fixing it now, as anyway this way of deleting
rows will have to be re-examined when we have versioning.
*/
allow_break
();
/* Allow SIGHUP & SIGINT */
DBUG_RETURN
(
my_errno
=
save_errno
);
}
...
...
storage/maria/ma_delete_table.c
View file @
ff3e4bd9
...
...
@@ -78,9 +78,9 @@ int maria_delete_table(const char *name)
{
/*
For this log record to be of any use for Recovery, we need the upper
MySQL layer to be crash-safe in DDLs
; when it is we should reconsider
the moment of writing this log record, how to use it in Recovery, and
force the log. For now this record is only informative
.
MySQL layer to be crash-safe in DDLs
.
For now this record can serve when we apply logs to a backup, so we sync
it
.
*/
LSN
lsn
;
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
];
...
...
@@ -91,7 +91,8 @@ int maria_delete_table(const char *name)
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
,
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]),
log_array
,
NULL
)))
log_array
,
NULL
)
||
translog_flush
(
lsn
)))
DBUG_RETURN
(
1
);
}
...
...
storage/maria/ma_loghandler.c
View file @
ff3e4bd9
...
...
@@ -61,21 +61,6 @@
#define COMPRESSED_LSN_MAX_STORE_SIZE (2 + LSN_STORE_SIZE)
#define MAX_NUMBER_OF_LSNS_PER_RECORD 2
/* record parts descriptor */
struct
st_translog_parts
{
/* full record length */
translog_size_t
record_length
;
/* full record length with chunk headers */
translog_size_t
total_record_length
;
/* current part index */
uint
current
;
/* total number of elements in parts */
uint
elements
;
/* array of parts (LEX_STRING) */
LEX_STRING
*
parts
;
};
/* log write buffer descriptor */
struct
st_translog_buffer
{
...
...
@@ -176,15 +161,6 @@ static byte end_of_log= 0;
my_bool
translog_inited
=
0
;
/* record classes */
enum
record_class
{
LOGRECTYPE_NOT_ALLOWED
,
LOGRECTYPE_VARIABLE_LENGTH
,
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
LOGRECTYPE_FIXEDLENGTH
};
/* chunk types */
#define TRANSLOG_CHUNK_LSN 0x00
/* 0 chunk refer as LSN (head or tail */
#define TRANSLOG_CHUNK_FIXED (1 << 6)
/* 1 (pseudo)fixed record (also LSN) */
...
...
@@ -196,52 +172,11 @@ enum record_class
/* compressed (relative) LSN constants */
#define TRANSLOG_CLSN_LEN_BITS 0xC0
/* Mask to get compressed LSN length */
typedef
my_bool
(
*
prewrite_rec_hook
)
(
enum
translog_record_type
type
,
TRN
*
trn
,
struct
st_maria_share
*
share
,
struct
st_translog_parts
*
parts
);
typedef
my_bool
(
*
inwrite_rec_hook
)
(
enum
translog_record_type
type
,
TRN
*
trn
,
LSN
*
lsn
,
struct
st_translog_parts
*
parts
);
typedef
uint16
(
*
read_rec_hook
)
(
enum
translog_record_type
type
,
uint16
read_length
,
uchar
*
read_buff
,
byte
*
decoded_buff
);
/*
Descriptor of log record type
Note: Don't reorder because of constructs later...
*/
struct
st_log_record_type_descriptor
{
/* internal class of the record */
enum
record_class
class
;
/*
length for fixed-size record, pseudo-fixed record
length with uncompressed LSNs
*/
uint16
fixed_length
;
/* how much record body (belonged to headers too) read with headers */
uint16
read_header_len
;
/* HOOK for writing the record called before lock */
prewrite_rec_hook
prewrite_hook
;
/* HOOK for writing the record called when LSN is known, inside lock */
inwrite_rec_hook
inwrite_hook
;
/* HOOK for reading headers */
read_rec_hook
read_hook
;
/*
For pseudo fixed records number of compressed LSNs followed by
system header
*/
int16
compressed_LSN
;
};
#include <my_atomic.h>
/* an array that maps id of a MARIA_SHARE to this MARIA_SHARE */
static
MARIA_SHARE
**
id_to_share
=
NULL
;
#define SHARE_ID_MAX 65535
/* array's size */
/* lock for id_to_share */
static
my_atomic_rwlock_t
LOCK_id_to_share
;
...
...
@@ -257,27 +192,32 @@ static my_bool write_hook_for_undo(enum translog_record_type type,
NOTE that after first public Maria release, these can NOT be changed
*/
typedef
struct
st_log_record_type_descriptor
LOG_DESC
;
static
LOG_DESC
log_record_type_descriptor
[
LOGREC_NUMBER_OF_TYPES
];
LOG_DESC
log_record_type_descriptor
[
LOGREC_NUMBER_OF_TYPES
];
static
LOG_DESC
INIT_LOGREC_FIXED_RECORD_0LSN_EXAMPLE
=
{
LOGRECTYPE_FIXEDLENGTH
,
6
,
6
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_FIXEDLENGTH
,
6
,
6
,
NULL
,
NULL
,
NULL
,
0
,
"fixed0example"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_VARIABLE_RECORD_0LSN_EXAMPLE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
9
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
9
,
NULL
,
NULL
,
NULL
,
0
,
"variable0example"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_FIXED_RECORD_1LSN_EXAMPLE
=
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
7
,
7
,
NULL
,
NULL
,
NULL
,
1
};
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
7
,
7
,
NULL
,
NULL
,
NULL
,
1
,
"fixed1example"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_VARIABLE_RECORD_1LSN_EXAMPLE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
12
,
NULL
,
NULL
,
NULL
,
1
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
12
,
NULL
,
NULL
,
NULL
,
1
,
"variable1example"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_FIXED_RECORD_2LSN_EXAMPLE
=
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
23
,
23
,
NULL
,
NULL
,
NULL
,
2
};
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
23
,
23
,
NULL
,
NULL
,
NULL
,
2
,
"fixed2example"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_VARIABLE_RECORD_2LSN_EXAMPLE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
19
,
NULL
,
NULL
,
NULL
,
2
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
19
,
NULL
,
NULL
,
NULL
,
2
,
"variable2example"
,
FALSE
,
NULL
,
NULL
};
void
example_loghandler_init
()
...
...
@@ -298,126 +238,158 @@ void example_loghandler_init()
static
LOG_DESC
INIT_LOGREC_RESERVED_FOR_CHUNKS23
=
{
LOGRECTYPE_NOT_ALLOWED
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_NOT_ALLOWED
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
,
"reserved"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_INSERT_ROW_HEAD
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
write_hook_for_redo
,
NULL
,
0
,
"redo_insert_row_head"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_INSERT_ROW_TAIL
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
write_hook_for_redo
,
NULL
,
0
,
"redo_insert_row_tail"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_INSERT_ROW_BLOB
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
8
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
8
,
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_insert_row_blob"
,
FALSE
,
NULL
,
NULL
};
/*QQQ:TODO:header???*/
static
LOG_DESC
INIT_LOGREC_REDO_INSERT_ROW_BLOBS
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
FILEID_STORE_SIZE
,
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_insert_row_blobs"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_PURGE_ROW_HEAD
=
{
LOGRECTYPE_FIXEDLENGTH
,
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_purge_row_head"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_PURGE_ROW_TAIL
=
{
LOGRECTYPE_FIXEDLENGTH
,
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_purge_row_tail"
,
FALSE
,
NULL
,
NULL
};
/* QQQ: TODO: variable and fixed size??? */
static
LOG_DESC
INIT_LOGREC_REDO_PURGE_BLOCKS
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
FILEID_STORE_SIZE
+
PAGERANGE_STORE_SIZE
+
PAGE_STORE_SIZE
+
PAGERANGE_STORE_SIZE
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
FILEID_STORE_SIZE
+
PAGERANGE_STORE_SIZE
,
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_purge_blocks"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_DELETE_ROW
=
{
LOGRECTYPE_FIXEDLENGTH
,
16
,
16
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
{
LOGRECTYPE_FIXEDLENGTH
,
16
,
16
,
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_delete_row"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_UPDATE_ROW_HEAD
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
9
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
9
,
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_update_row_head"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_INDEX
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
9
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
9
,
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_index"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_UNDELETE_ROW
=
{
LOGRECTYPE_FIXEDLENGTH
,
16
,
16
,
NULL
,
write_hook_for_redo
,
NULL
,
0
};
{
LOGRECTYPE_FIXEDLENGTH
,
16
,
16
,
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_undelete_row"
,
FALSE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_CLR_END
=
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
5
,
5
,
NULL
,
write_hook_for_redo
,
NULL
,
1
};
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
5
,
5
,
NULL
,
write_hook_for_redo
,
NULL
,
1
,
"clr_end"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_PURGE_END
=
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
5
,
5
,
NULL
,
NULL
,
NULL
,
1
};
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
5
,
5
,
NULL
,
NULL
,
NULL
,
1
,
"purge_end"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_UNDO_ROW_INSERT
=
{
LOGRECTYPE_FIXEDLENGTH
,
LSN_STORE_SIZE
+
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
LSN_STORE_SIZE
+
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
NULL
,
write_hook_for_undo
,
NULL
,
0
};
NULL
,
write_hook_for_undo
,
NULL
,
0
,
"undo_row_insert"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_UNDO_ROW_DELETE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
LSN_STORE_SIZE
+
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
NULL
,
write_hook_for_undo
,
NULL
,
0
};
NULL
,
write_hook_for_undo
,
NULL
,
0
,
"undo_row_delete"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_UNDO_ROW_UPDATE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
LSN_STORE_SIZE
+
FILEID_STORE_SIZE
+
PAGE_STORE_SIZE
+
DIRPOS_STORE_SIZE
,
NULL
,
write_hook_for_undo
,
NULL
,
1
};
NULL
,
write_hook_for_undo
,
NULL
,
1
,
"undo_row_update"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_UNDO_ROW_PURGE
=
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
LSN_STORE_SIZE
,
LSN_STORE_SIZE
,
NULL
,
NULL
,
NULL
,
1
};
NULL
,
NULL
,
NULL
,
1
,
"undo_row_purge"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_UNDO_KEY_INSERT
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
10
,
NULL
,
write_hook_for_undo
,
NULL
,
1
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
10
,
NULL
,
write_hook_for_undo
,
NULL
,
1
,
"undo_key_insert"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_UNDO_KEY_DELETE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
15
,
NULL
,
write_hook_for_undo
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
15
,
NULL
,
write_hook_for_undo
,
NULL
,
0
,
"undo_key_delete"
,
TRUE
,
NULL
,
NULL
};
// QQ: why not compressed?
static
LOG_DESC
INIT_LOGREC_PREPARE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
,
"prepare"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_PREPARE_WITH_UNDO_PURGE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
5
,
NULL
,
NULL
,
NULL
,
1
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
5
,
NULL
,
NULL
,
NULL
,
1
,
"prepare_with_undo_purge"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_COMMIT
=
{
LOGRECTYPE_FIXEDLENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_FIXEDLENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
,
"commit"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_COMMIT_WITH_UNDO_PURGE
=
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
5
,
5
,
NULL
,
NULL
,
NULL
,
1
};
{
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
5
,
5
,
NULL
,
NULL
,
NULL
,
1
,
"commit_with_undo_purge"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_CHECKPOINT
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
,
"checkpoint"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_CREATE_TABLE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
1
+
2
,
NULL
,
NULL
,
NULL
,
0
,
"redo_create_table"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_RENAME_TABLE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
,
"redo_rename_table"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_DROP_TABLE
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
0
,
NULL
,
NULL
,
NULL
,
0
,
"redo_drop_table"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_DELETE_ALL
=
{
LOGRECTYPE_FIXEDLENGTH
,
FILEID_STORE_SIZE
,
FILEID_STORE_SIZE
,
NULL
,
NULL
,
NULL
,
0
};
NULL
,
write_hook_for_redo
,
NULL
,
0
,
"redo_delete_all"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_REDO_REPAIR_TABLE
=
{
LOGRECTYPE_FIXEDLENGTH
,
FILEID_STORE_SIZE
+
4
,
FILEID_STORE_SIZE
+
4
,
NULL
,
NULL
,
NULL
,
0
};
NULL
,
NULL
,
NULL
,
0
,
"redo_repair_table"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_FILE_ID
=
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
4
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_VARIABLE_LENGTH
,
0
,
2
,
NULL
,
NULL
,
NULL
,
0
,
"file_id"
,
TRUE
,
NULL
,
NULL
};
static
LOG_DESC
INIT_LOGREC_LONG_TRANSACTION_ID
=
{
LOGRECTYPE_FIXEDLENGTH
,
6
,
6
,
NULL
,
NULL
,
NULL
,
0
};
{
LOGRECTYPE_FIXEDLENGTH
,
6
,
6
,
NULL
,
NULL
,
NULL
,
0
,
"long_transaction_id"
,
TRUE
,
NULL
,
NULL
};
const
myf
log_write_flags
=
MY_WME
|
MY_NABP
|
MY_WAIT_IF_FULL
;
...
...
@@ -701,7 +673,7 @@ static my_bool translog_buffer_init(struct st_translog_buffer *buffer)
{
DBUG_ENTER
(
"translog_buffer_init"
);
/* This buffer offset */
buffer
->
last_lsn
=
CONTROL_FILE_IMPOSSIBLE_LSN
;
buffer
->
last_lsn
=
LSN_IMPOSSIBLE
;
/* This Buffer File */
buffer
->
file
=
-
1
;
buffer
->
overlay
=
0
;
...
...
@@ -779,7 +751,7 @@ static my_bool translog_create_new_file()
translog_write_file_header
())
DBUG_RETURN
(
1
);
if
(
ma_control_file_write_and_force
(
CONTROL_FILE_IMPOSSIBLE_LSN
,
file_no
,
if
(
ma_control_file_write_and_force
(
LSN_IMPOSSIBLE
,
file_no
,
CONTROL_FILE_UPDATE_ONLY_LOGNO
))
DBUG_RETURN
(
1
);
...
...
@@ -1206,7 +1178,7 @@ static void translog_start_buffer(struct st_translog_buffer *buffer,
(
ulong
)
LSN_OFFSET
(
log_descriptor
.
horizon
),
(
ulong
)
LSN_OFFSET
(
log_descriptor
.
horizon
)));
DBUG_ASSERT
(
buffer_no
==
buffer
->
buffer_no
);
buffer
->
last_lsn
=
CONTROL_FILE_IMPOSSIBLE_LSN
;
buffer
->
last_lsn
=
LSN_IMPOSSIBLE
;
buffer
->
offset
=
log_descriptor
.
horizon
;
buffer
->
file
=
log_descriptor
.
log_file_num
[
0
];
buffer
->
overlay
=
0
;
...
...
@@ -2088,7 +2060,7 @@ my_bool translog_init(const char *directory,
i
,
(
ulong
)
log_descriptor
.
buffers
+
i
));
}
logs_found
=
(
last_logno
!=
CONTROL_FILE_IMPOSSIBLE_FILENO
);
logs_found
=
(
last_logno
!=
FILENO_IMPOSSIBLE
);
if
(
logs_found
)
{
...
...
@@ -2100,7 +2072,7 @@ my_bool translog_init(const char *directory,
find the log end
*/
if
(
LSN_FILE_NO
(
last_checkpoint_lsn
)
==
CONTROL_FILE_IMPOSSIBLE_FILENO
)
if
(
LSN_FILE_NO
(
last_checkpoint_lsn
)
==
FILENO_IMPOSSIBLE
)
{
DBUG_ASSERT
(
LSN_OFFSET
(
last_checkpoint_lsn
)
==
0
);
/* there was no checkpoints we will read from the beginning */
...
...
@@ -2138,7 +2110,7 @@ my_bool translog_init(const char *directory,
/* TODO: check page size */
last_valid_page
=
CONTROL_FILE_IMPOSSIBLE_LSN
;
last_valid_page
=
LSN_IMPOSSIBLE
;
/* scan and validate pages */
do
{
...
...
@@ -2186,7 +2158,7 @@ my_bool translog_init(const char *directory,
current_page
=
LSN_REPLACE_OFFSET
(
current_page
,
TRANSLOG_PAGE_SIZE
);
}
while
(
LSN_FILE_NO
(
current_page
)
<=
LSN_FILE_NO
(
last_page
)
&&
!
old_log_was_recovered
);
if
(
last_valid_page
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
last_valid_page
==
LSN_IMPOSSIBLE
)
{
/* Panic!!! Even page which should be valid is invalid */
/* TODO: issue error */
...
...
@@ -2272,7 +2244,7 @@ my_bool translog_init(const char *directory,
open_logfile_by_number_no_cache
(
1
))
==
-
1
||
translog_write_file_header
())
DBUG_RETURN
(
1
);
if
(
ma_control_file_write_and_force
(
CONTROL_FILE_IMPOSSIBLE_LSN
,
1
,
if
(
ma_control_file_write_and_force
(
LSN_IMPOSSIBLE
,
1
,
CONTROL_FILE_UPDATE_ONLY_LOGNO
))
DBUG_RETURN
(
1
);
/* assign buffer 0 */
...
...
@@ -2309,8 +2281,8 @@ my_bool translog_init(const char *directory,
structures for generating 2-byte ids:
*/
my_atomic_rwlock_init
(
&
LOCK_id_to_share
);
id_to_share
=
(
MARIA_SHARE
**
)
my_malloc
(
SHARE_ID_MAX
*
sizeof
(
MARIA_SHARE
*
),
MYF
(
MY_WME
|
MY_ZEROFILL
));
id_to_share
=
(
MARIA_SHARE
**
)
my_malloc
(
SHARE_ID_MAX
*
sizeof
(
MARIA_SHARE
*
),
MYF
(
MY_WME
|
MY_ZEROFILL
));
if
(
unlikely
(
!
id_to_share
))
DBUG_RETURN
(
1
);
id_to_share
--
;
/* min id is 1 */
...
...
@@ -2405,7 +2377,7 @@ void translog_destroy()
1 Error
*/
static
my_bool
translog_lock
()
my_bool
translog_lock
()
{
struct
st_translog_buffer
*
current_buffer
;
DBUG_ENTER
(
"translog_lock"
);
...
...
@@ -2438,7 +2410,7 @@ static my_bool translog_lock()
1 Error
*/
static
inline
my_bool
translog_unlock
()
my_bool
translog_unlock
()
{
DBUG_ENTER
(
"translog_unlock"
);
translog_buffer_unlock
(
log_descriptor
.
bc
.
buffer
);
...
...
@@ -4312,14 +4284,14 @@ my_bool translog_write_record(LSN *lsn,
}
if
(
unlikely
(
!
(
trn
->
first_undo_lsn
&
TRANSACTION_LOGGED_LONG_ID
)))
{
LSN
lsn
;
LSN
dummy_
lsn
;
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
];
uchar
log_data
[
6
];
int6store
(
log_data
,
trn
->
trid
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
=
(
char
*
)
log_data
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
sizeof
(
log_data
);
trn
->
first_undo_lsn
|=
TRANSACTION_LOGGED_LONG_ID
;
/* no recursion */
if
(
unlikely
(
translog_write_record
(
&
lsn
,
LOGREC_LONG_TRANSACTION_ID
,
if
(
unlikely
(
translog_write_record
(
&
dummy_
lsn
,
LOGREC_LONG_TRANSACTION_ID
,
trn
,
NULL
,
sizeof
(
log_data
),
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]),
log_array
,
NULL
)))
...
...
@@ -4404,6 +4376,8 @@ my_bool translog_write_record(LSN *lsn,
}
}
DBUG_PRINT
(
"info"
,
(
"LSN: (%lu,0x%lx)"
,
(
ulong
)
LSN_FILE_NO
(
*
lsn
),
(
ulong
)
LSN_OFFSET
(
*
lsn
)));
DBUG_RETURN
(
rc
);
}
...
...
@@ -5093,7 +5067,7 @@ translog_read_record_header_scan(TRANSLOG_SCANNER_DATA
- it is like translog_read_record_header, but read next record, so see
its NOTES.
- in case of end of the log buff->lsn will be set to
(
CONTROL_FILE_IMPOSSIBLE_LSN
)
(
LSN_IMPOSSIBLE
)
RETURN
0 error
...
...
@@ -5138,7 +5112,7 @@ translog_size_t translog_read_next_record_header(TRANSLOG_SCANNER_DATA
if
(
scanner
->
page
[
scanner
->
page_offset
]
==
0
)
{
/* Last record was read */
buff
->
lsn
=
CONTROL_FILE_IMPOSSIBLE_LSN
;
buff
->
lsn
=
LSN_IMPOSSIBLE
;
/* Return 'end of log' marker */
DBUG_RETURN
(
TRANSLOG_RECORD_HEADER_MAX_SIZE
+
1
);
}
...
...
@@ -5300,7 +5274,7 @@ translog_size_t translog_read_record(LSN lsn,
if
(
data
==
NULL
)
{
DBUG_ASSERT
(
lsn
!=
CONTROL_FILE_IMPOSSIBLE_LSN
);
DBUG_ASSERT
(
lsn
!=
LSN_IMPOSSIBLE
);
data
=
&
internal_data
;
}
if
(
lsn
||
...
...
@@ -5707,21 +5681,23 @@ int translog_assign_id_to_share(MARIA_SHARE *share, TRN *trn)
if
(
likely
(
share
->
id
==
0
))
{
/* Inspired by set_short_trid() of trnman.c */
int
i
=
share
->
kfile
.
file
%
SHARE_ID_MAX
+
1
;
my_atomic_rwlock_wrlock
(
&
LOCK_id_to_share
);
/**
@todo RECOVERY BUG: if all slots are used, and we're using rwlocks
above, we will never exit the loop. To be discussed with Serg.
*/
for
(
;
;
i
=
i
%
SHARE_ID_MAX
+
1
)
/* the range is [1..SHARE_ID_MAX] */
uint
i
=
share
->
kfile
.
file
%
SHARE_ID_MAX
+
1
;
do
{
void
*
tmp
=
NULL
;
if
(
id_to_share
[
i
]
==
NULL
&&
my_atomic_casptr
((
void
**
)
&
id_to_share
[
i
],
&
tmp
,
share
))
break
;
}
my_atomic_rwlock_wrunlock
(
&
LOCK_id_to_share
);
share
->
id
=
(
uint16
)
i
;
my_atomic_rwlock_wrlock
(
&
LOCK_id_to_share
);
for
(
;
i
<=
SHARE_ID_MAX
;
i
++
)
/* the range is [1..SHARE_ID_MAX] */
{
void
*
tmp
=
NULL
;
if
(
id_to_share
[
i
]
==
NULL
&&
my_atomic_casptr
((
void
**
)
&
id_to_share
[
i
],
&
tmp
,
share
))
{
share
->
id
=
(
uint16
)
i
;
break
;
}
}
my_atomic_rwlock_wrunlock
(
&
LOCK_id_to_share
);
i
=
1
;
/* scan the whole array */
}
while
(
share
->
id
==
0
);
DBUG_PRINT
(
"info"
,
(
"id_to_share: 0x%lx -> %u"
,
(
ulong
)
share
,
i
));
LSN
lsn
;
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
2
];
...
...
@@ -5739,7 +5715,7 @@ int translog_assign_id_to_share(MARIA_SHARE *share, TRN *trn)
strlen()
*/
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
length
=
strlen
(
share
->
open_file_name
);
strlen
(
share
->
open_file_name
)
+
1
;
if
(
unlikely
(
translog_write_record
(
&
lsn
,
LOGREC_FILE_ID
,
trn
,
share
,
sizeof
(
log_data
)
+
log_array
[
TRANSLOG_INTERNAL_PARTS
+
...
...
@@ -5773,3 +5749,15 @@ void translog_deassign_id_from_share(MARIA_SHARE *share)
my_atomic_storeptr
((
void
**
)
&
id_to_share
[
share
->
id
],
0
);
my_atomic_rwlock_rdunlock
(
&
LOCK_id_to_share
);
}
/**
@brief returns the LSN of the first record starting in this log
@note so far works only for the very first log created on this system
*/
LSN
first_lsn_in_log
()
{
return
MAKE_LSN
(
1
,
TRANSLOG_PAGE_SIZE
+
log_descriptor
.
page_overhead
);
}
storage/maria/ma_loghandler.h
View file @
ff3e4bd9
/* Copyright (C) 2007 MySQL AB & Sanja Belkin
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
#ifndef _ma_loghandler_h
#define _ma_loghandler_h
/* transaction log default cache size (TODO: make it global variable) */
#define TRANSLOG_PAGECACHE_SIZE 1024*1024*2
/* transaction log default file size (TODO: make it global variable) */
...
...
@@ -20,6 +38,7 @@
#define TRANSLOG_PAGE_SIZE (8*1024)
#include "ma_loghandler_lsn.h"
#include "trnman_public.h"
/* short transaction ID type */
typedef
uint16
SHORT_TRANSACTION_ID
;
...
...
@@ -41,6 +60,10 @@ struct st_maria_share;
#define page_store(T,A) int5store(T,A)
#define dirpos_store(T,A) ((*(uchar*) (T)) = A)
#define pagerange_store(T,A) int2store(T,A)
#define fileid_korr(P) uint2korr(P)
#define page_korr(P) uint5korr(P)
#define dirpos_korr(P) (P[0])
#define pagerange_korr(P) uint2korr(P)
/*
Length of disk drive sector size (we assume that writing it
...
...
@@ -228,10 +251,102 @@ extern translog_size_t translog_read_next_record_header(TRANSLOG_SCANNER_DATA
*
scanner
,
TRANSLOG_HEADER_BUFFER
*
buff
);
extern
my_bool
translog_lock
();
extern
my_bool
translog_unlock
();
extern
void
translog_lock_assert_owner
();
extern
TRANSLOG_ADDRESS
translog_get_horizon
();
extern
int
translog_assign_id_to_share
(
struct
st_maria_share
*
share
,
struct
st_transaction
*
trn
);
extern
void
translog_deassign_id_from_share
(
struct
st_maria_share
*
share
);
extern
my_bool
translog_inited
;
/*
all the rest added because of recovery; should we make
ma_loghandler_for_recovery.h ?
*/
#define SHARE_ID_MAX 65535
/* array's size */
extern
LSN
first_lsn_in_log
();
/* record parts descriptor */
struct
st_translog_parts
{
/* full record length */
translog_size_t
record_length
;
/* full record length with chunk headers */
translog_size_t
total_record_length
;
/* current part index */
uint
current
;
/* total number of elements in parts */
uint
elements
;
/* array of parts (LEX_STRING) */
LEX_STRING
*
parts
;
};
typedef
my_bool
(
*
prewrite_rec_hook
)
(
enum
translog_record_type
type
,
TRN
*
trn
,
struct
st_maria_share
*
share
,
struct
st_translog_parts
*
parts
);
typedef
my_bool
(
*
inwrite_rec_hook
)
(
enum
translog_record_type
type
,
TRN
*
trn
,
LSN
*
lsn
,
struct
st_translog_parts
*
parts
);
typedef
uint16
(
*
read_rec_hook
)
(
enum
translog_record_type
type
,
uint16
read_length
,
uchar
*
read_buff
,
byte
*
decoded_buff
);
/* record classes */
enum
record_class
{
LOGRECTYPE_NOT_ALLOWED
,
LOGRECTYPE_VARIABLE_LENGTH
,
LOGRECTYPE_PSEUDOFIXEDLENGTH
,
LOGRECTYPE_FIXEDLENGTH
};
/* C++ can't bear that a variable's name is "class" */
#ifndef __cplusplus
/*
Descriptor of log record type
Note: Don't reorder because of constructs later...
*/
typedef
struct
st_log_record_type_descriptor
{
/* internal class of the record */
enum
record_class
class
;
/*
length for fixed-size record, pseudo-fixed record
length with uncompressed LSNs
*/
uint16
fixed_length
;
/* how much record body (belonged to headers too) read with headers */
uint16
read_header_len
;
/* HOOK for writing the record called before lock */
prewrite_rec_hook
prewrite_hook
;
/* HOOK for writing the record called when LSN is known, inside lock */
inwrite_rec_hook
inwrite_hook
;
/* HOOK for reading headers */
read_rec_hook
read_hook
;
/*
For pseudo fixed records number of compressed LSNs followed by
system header
*/
int16
compressed_LSN
;
/* the rest is for maria_read_log & Recovery */
/** @brief for debug error messages or "maria_read_log" command-line tool */
const
char
*
name
;
my_bool
record_ends_group
;
/* a function to execute when we see the record during the REDO phase */
int
(
*
record_execute_in_redo_phase
)(
const
TRANSLOG_HEADER_BUFFER
*
);
/* a function to execute when we see the record during the UNDO phase */
int
(
*
record_execute_in_undo_phase
)(
const
TRANSLOG_HEADER_BUFFER
*
);
}
LOG_DESC
;
extern
LOG_DESC
log_record_type_descriptor
[
LOGREC_NUMBER_OF_TYPES
];
#endif
C_MODE_END
#endif
storage/maria/ma_loghandler_lsn.h
View file @
ff3e4bd9
/* Copyright (C) 2007 MySQL AB & Sanja Belkin
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
#ifndef _ma_loghandler_lsn_h
#define _ma_loghandler_lsn_h
...
...
@@ -24,7 +39,7 @@ typedef TRANSLOG_ADDRESS LSN;
#define LSN_FILE_NO(L) ((L) >> 32)
/* Gets raw file number part of a LSN/log address */
#define LSN_FI
N
E_NO_PART(L) ((L) & ((int64)0xFFFFFF00000000LL))
#define LSN_FI
L
E_NO_PART(L) ((L) & ((int64)0xFFFFFF00000000LL))
/* Gets record offset of a LSN/log address */
#define LSN_OFFSET(L) ((L) & 0xFFFFFFFFL)
...
...
@@ -33,7 +48,9 @@ typedef TRANSLOG_ADDRESS LSN;
#define MAKE_LSN(F,S) ((((uint64)(F)) << 32) | (S))
/* checks LSN */
#define LSN_VALID(L) DBUG_ASSERT((L) >= 0 && (L) < (uint64)0xFFFFFFFFFFFFFFLL)
#define LSN_VALID(L) \
((LSN_FILE_NO_PART(L) != FILENO_IMPOSSIBLE) && \
(LSN_OFFSET(L) != LOG_OFFSET_IMPOSSIBLE))
/* size of stored LSN on a disk, don't change it! */
#define LSN_STORE_SIZE 7
...
...
@@ -51,7 +68,7 @@ typedef TRANSLOG_ADDRESS LSN;
/* what we need to add to LSN to increase it on one file */
#define LSN_ONE_FILE ((int64)0x100000000LL)
#define LSN_REPLACE_OFFSET(L, S) (LSN_FI
N
E_NO_PART(L) | (S))
#define LSN_REPLACE_OFFSET(L, S) (LSN_FI
L
E_NO_PART(L) | (S))
/*
an 8-byte type whose most significant byte is used for "flags"; 7
...
...
@@ -61,4 +78,7 @@ typedef LSN LSN_WITH_FLAGS;
#define LSN_WITH_FLAGS_TO_LSN(x) (x & ULL(0x00FFFFFFFFFFFFFF))
#define LSN_WITH_FLAGS_TO_FLAGS(x) (x & ULL(0xFF00000000000000))
#define FILENO_IMPOSSIBLE 0
/**< log file's numbering starts at 1 */
#define LOG_OFFSET_IMPOSSIBLE 0
/**< log always has a header */
#define LSN_IMPOSSIBLE 0
#endif
storage/maria/ma_open.c
View file @
ff3e4bd9
...
...
@@ -587,7 +587,19 @@ MARIA_HA *maria_open(const char *name, int mode, uint open_flags)
share
->
base
.
pack_bytes
+
test
(
share
->
options
&
HA_OPTION_CHECKSUM
));
if
(
share
->
base
.
transactional
)
{
share
->
base_length
+=
TRANS_ROW_EXTRA_HEADER_SIZE
;
if
(
unlikely
((
share
->
state
.
create_rename_lsn
==
(
LSN
)
ULONGLONG_MAX
)
&&
(
open_flags
&
HA_OPEN_FROM_SQL_LAYER
)))
{
/*
This table was repaired with maria_chk. Past log records should be
ignored, future log records should not: we define the present.
*/
share
->
state
.
create_rename_lsn
=
translog_get_horizon
();
_ma_update_create_rename_lsn_on_disk
(
share
,
TRUE
);
}
}
share
->
base
.
default_rec_buff_size
=
max
(
share
->
base
.
pack_reclength
,
share
->
base
.
max_key_length
);
share
->
page_type
=
(
share
->
base
.
transactional
?
PAGECACHE_LSN_PAGE
:
...
...
storage/maria/ma_pagecache.c
View file @
ff3e4bd9
...
...
@@ -587,11 +587,7 @@ static uint pagecache_fwrite(PAGECACHE *pagecache,
DBUG_PRINT
(
"info"
,
(
"Log handler call"
));
/* TODO: integrate with page format */
lsn
=
lsn_korr
(
buffer
+
PAGE_LSN_OFFSET
);
/*
check CONTROL_FILE_IMPOSSIBLE_FILENO &
CONTROL_FILE_IMPOSSIBLE_LOG_OFFSET
*/
DBUG_ASSERT
(
lsn
!=
0
);
DBUG_ASSERT
(
LSN_VALID
(
lsn
));
translog_flush
(
lsn
);
}
DBUG_RETURN
(
my_pwrite
(
filedesc
->
file
,
buffer
,
pagecache
->
block_size
,
...
...
@@ -2474,7 +2470,7 @@ static void check_and_set_lsn(LSN lsn, PAGECACHE_BLOCK_LINK *block)
lock lock change
pin pin page
first_REDO_LSN_for_page do not set it if it is zero
lsn if it is not
CONTROL_FILE_IMPOSSIBLE_LSN
(0) and it
lsn if it is not
LSN_IMPOSSIBLE
(0) and it
is bigger then LSN on the page it will be written on
the page
...
...
@@ -2566,7 +2562,7 @@ void pagecache_unlock(PAGECACHE *pagecache,
pagecache pointer to a page cache data structure
file handler for the file for the block of data to be read
pageno number of the block of data in the file
lsn if it is not
CONTROL_FILE_IMPOSSIBLE_LSN
(0) and it
lsn if it is not
LSN_IMPOSSIBLE
(0) and it
is bigger then LSN on the page it will be written on
the page
*/
...
...
@@ -2635,10 +2631,9 @@ void pagecache_unpin(PAGECACHE *pagecache,
link direct link to page (returned by read or write)
lock lock change
pin pin page
first_REDO_LSN_for_page do not set it if it is zero
lsn if it is not CONTROL_FILE_IMPOSSIBLE_LSN (0) and it
is bigger then LSN on the page it will be written on
the page
first_REDO_LSN_for_page do not set it if it is LSN_IMPOSSIBLE (0)
lsn if it is not LSN_IMPOSSIBLE and it is bigger then
LSN on the page it will be written on the page
*/
void
pagecache_unlock_by_link
(
PAGECACHE
*
pagecache
,
...
...
@@ -2681,7 +2676,7 @@ void pagecache_unlock_by_link(PAGECACHE *pagecache,
DBUG_ASSERT
(
pagecache
->
can_be_used
);
inc_counter_for_resize_op
(
pagecache
);
if
(
first_REDO_LSN_for_page
)
if
(
first_REDO_LSN_for_page
!=
LSN_IMPOSSIBLE
)
{
/*
LOCK_READ_UNLOCK is ok here as the page may have first locked
...
...
@@ -2694,10 +2689,8 @@ void pagecache_unlock_by_link(PAGECACHE *pagecache,
if
(
block
->
rec_lsn
==
0
)
block
->
rec_lsn
=
first_REDO_LSN_for_page
;
}
if
(
lsn
!=
0
)
{
if
(
lsn
!=
LSN_IMPOSSIBLE
)
check_and_set_lsn
(
lsn
,
block
);
}
if
(
make_lock_and_pin
(
pagecache
,
block
,
lock
,
pin
))
DBUG_ASSERT
(
0
);
/* should not happend */
...
...
@@ -2726,7 +2719,7 @@ void pagecache_unlock_by_link(PAGECACHE *pagecache,
pagecache_unpin_by_link()
pagecache pointer to a page cache data structure
link direct link to page (returned by read or write)
lsn if it is not
CONTROL_FILE_IMPOSSIBLE_LSN
(0) and it
lsn if it is not
LSN_IMPOSSIBLE
(0) and it
is bigger then LSN on the page it will be written on
the page
*/
...
...
storage/maria/ma_recovery.h
View file @
ff3e4bd9
/* Copyright (C) 2006
MySQL AB & MySQL Finland AB & TCX DataKonsult
AB
/* Copyright (C) 2006
,2007 MySQL
AB
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
...
...
storage/maria/ma_rename.c
View file @
ff3e4bd9
...
...
@@ -60,13 +60,13 @@ int maria_rename(const char *old_name, const char *new_name)
MY_SYNC_DIR
:
0
;
if
(
sync_dir
)
{
uchar
log_data
[
LSN_STORE_SIZE
];
uchar
log_data
[
2
+
2
];
LEX_STRING
log_array
[
TRANSLOG_INTERNAL_PARTS
+
3
];
uint
old_name_len
=
strlen
(
old_name
),
new_name_len
=
strlen
(
new_name
);
int2store
(
log_data
,
old_name_len
);
int2store
(
log_data
+
2
,
new_name_len
);
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
str
=
log_data
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
2
+
2
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
0
].
length
=
sizeof
(
log_data
)
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
str
=
(
char
*
)
old_name
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
1
].
length
=
old_name_len
;
log_array
[
TRANSLOG_INTERNAL_PARTS
+
2
].
str
=
(
char
*
)
new_name
;
...
...
@@ -76,15 +76,16 @@ int maria_rename(const char *old_name, const char *new_name)
MySQL layer to be crash-safe, which it is not now (that would require
work using the ddl_log of sql/sql_table.cc); when it is, we should
reconsider the moment of writing this log record (before or after op,
under THR_LOCK_maria or not...), how to use it in Recovery
, and force
the log. For now this record is just informative
.
under THR_LOCK_maria or not...), how to use it in Recovery
.
For now it can serve to apply logs to a backup so we sync it
.
*/
if
(
unlikely
(
translog_write_record
(
&
share
->
state
.
create_rename_lsn
,
LOGREC_REDO_RENAME_TABLE
,
&
dummy_transaction_object
,
NULL
,
2
+
2
+
old_name_len
+
new_name_len
,
sizeof
(
log_array
)
/
sizeof
(
log_array
[
0
]),
log_array
,
NULL
)))
log_array
,
NULL
)
||
translog_flush
(
share
->
state
.
create_rename_lsn
)))
{
maria_close
(
info
);
DBUG_RETURN
(
1
);
...
...
@@ -93,10 +94,7 @@ int maria_rename(const char *old_name, const char *new_name)
store LSN into file, needed for Recovery to not be confused if a
RENAME happened (applying REDOs to the wrong table).
*/
lsn_store
(
log_data
,
share
->
state
.
create_rename_lsn
);
if
(
my_pwrite
(
share
->
kfile
.
file
,
log_data
,
sizeof
(
log_data
),
sizeof
(
share
->
state
.
header
)
+
2
,
MYF
(
MY_NABP
))
||
my_sync
(
share
->
kfile
.
file
,
MYF
(
MY_WME
)))
if
(
_ma_update_create_rename_lsn_on_disk
(
share
,
TRUE
))
{
maria_close
(
info
);
DBUG_RETURN
(
1
);
...
...
storage/maria/ma_test1.c
View file @
ff3e4bd9
...
...
@@ -60,7 +60,7 @@ int main(int argc,char *argv[])
if
(
maria_init
()
||
(
init_pagecache
(
maria_pagecache
,
IO_SIZE
*
16
,
0
,
0
,
maria_block_size
)
==
0
)
||
ma_control_file_create_or_open
()
||
ma_control_file_create_or_open
(
TRUE
)
||
(
init_pagecache
(
maria_log_pagecache
,
TRANSLOG_PAGECACHE_SIZE
,
0
,
0
,
TRANSLOG_PAGE_SIZE
)
==
0
)
||
...
...
storage/maria/ma_test2.c
View file @
ff3e4bd9
...
...
@@ -224,7 +224,7 @@ int main(int argc, char *argv[])
/* Maria requires that we always have a page cache */
if
((
init_pagecache
(
maria_pagecache
,
pagecache_size
,
0
,
0
,
maria_block_size
)
==
0
)
||
ma_control_file_create_or_open
()
||
ma_control_file_create_or_open
(
TRUE
)
||
(
init_pagecache
(
maria_log_pagecache
,
TRANSLOG_PAGECACHE_SIZE
,
0
,
0
,
TRANSLOG_PAGE_SIZE
)
==
0
)
||
...
...
storage/maria/maria_chk.c
View file @
ff3e4bd9
...
...
@@ -1026,6 +1026,13 @@ static int maria_chk(HA_CHECK *param, my_string filename)
}
if
(
!
error
)
{
/*
Tell the server's Recovery to ignore old REDOs on this table; we don't
know what the log's end LSN is now, so we just let the server know
that it will have to find and store it.
*/
if
(
share
->
base
.
transactional
)
share
->
state
.
create_rename_lsn
=
(
LSN
)
ULONGLONG_MAX
;
if
((
param
->
testflag
&
(
T_REP_BY_SORT
|
T_REP_PARALLEL
))
&&
(
maria_is_any_key_active
(
share
->
state
.
key_map
)
||
(
rep_quick
&&
!
param
->
keys_in_use
&&
!
recreate
))
&&
...
...
storage/maria/maria_def.h
View file @
ff3e4bd9
...
...
@@ -886,13 +886,13 @@ void _ma_remap_file(MARIA_HA *info, my_off_t size);
MARIA_RECORD_POS
_ma_write_init_default
(
MARIA_HA
*
info
,
const
byte
*
record
);
my_bool
_ma_write_abort_default
(
MARIA_HA
*
info
);
/* Functions needed by _ma_check (are overrided in MySQL) */
C_MODE_START
int
_ma_repair_write_log_record
(
const
HA_CHECK
*
param
,
MARIA_HA
*
info
);
/* Functions needed by _ma_check (are overrided in MySQL) */
volatile
int
*
_ma_killed_ptr
(
HA_CHECK
*
param
);
void
_ma_check_print_error
_VARARGS
((
HA_CHECK
*
param
,
const
char
*
fmt
,
...));
void
_ma_check_print_warning
_VARARGS
((
HA_CHECK
*
param
,
const
char
*
fmt
,
...));
void
_ma_check_print_info
_VARARGS
((
HA_CHECK
*
param
,
const
char
*
fmt
,
...));
int
_ma_repair_write_log_record
(
const
HA_CHECK
*
param
,
MARIA_HA
*
info
);
C_MODE_END
int
_ma_flush_pending_blocks
(
MARIA_SORT_PARAM
*
param
);
...
...
@@ -909,6 +909,7 @@ int _ma_create_index_by_sort(MARIA_SORT_PARAM *info, my_bool no_messages,
ulong
);
int
_ma_sync_table_files
(
const
MARIA_HA
*
info
);
int
_ma_initialize_data_file
(
File
dfile
,
MARIA_SHARE
*
share
);
int
_ma_update_create_rename_lsn_on_disk
(
MARIA_SHARE
*
share
,
my_bool
do_sync
);
void
_ma_unpin_all_pages
(
MARIA_HA
*
info
,
LSN
undo_lsn
);
...
...
storage/maria/maria_read_log.c
0 → 100644
View file @
ff3e4bd9
/* Copyright (C) 2007 MySQL AB
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
#include "maria_def.h"
#include <my_getopt.h>
#define PCACHE_SIZE (1024*1024*10)
#define LOG_FLAGS 0
#define LOG_FILE_SIZE (1024L*1024L)
static
PAGECACHE
pagecache
;
static
const
char
*
load_default_groups
[]
=
{
"maria_read_log"
,
0
};
static
void
get_options
(
int
*
argc
,
char
*
*
*
argv
);
#ifndef DBUG_OFF
static
const
char
*
default_dbug_option
;
#endif
static
my_bool
opt_only_display
,
opt_display_and_apply
;
struct
TRN_FOR_RECOVERY
{
LSN
group_start_lsn
,
undo_lsn
;
TrID
long_trid
;
};
struct
TRN_FOR_RECOVERY
all_active_trans
[
SHORT_TRID_MAX
+
1
];
MARIA_HA
*
all_tables
[
SHORT_TRID_MAX
+
1
];
LSN
current_group_end_lsn
=
LSN_IMPOSSIBLE
;
static
void
end_of_redo_phase
();
static
void
display_record_position
(
const
LOG_DESC
*
log_desc
,
const
TRANSLOG_HEADER_BUFFER
*
rec
,
uint
number
);
static
int
display_and_apply_record
(
const
LOG_DESC
*
log_desc
,
const
TRANSLOG_HEADER_BUFFER
*
rec
);
#define prototype_exec_hook(R) \
static int exec_LOGREC_ ## R(const TRANSLOG_HEADER_BUFFER *rec)
prototype_exec_hook
(
LONG_TRANSACTION_ID
);
#ifdef MARIA_CHECKPOINT
prototype_exec_hook
(
CHECKPOINT
);
#endif
prototype_exec_hook
(
REDO_CREATE_TABLE
);
prototype_exec_hook
(
FILE_ID
);
prototype_exec_hook
(
REDO_INSERT_ROW_HEAD
);
prototype_exec_hook
(
COMMIT
);
/*
To implement REDO_DROP_TABLE and REDO_RENAME_TABLE, we would need to go
through the all_tables[] array, find all open instances of the
table-to-drop-or-rename, and remove them from the array.
We however know that in real Recovery, we don't have to handle those log
records at all, same for REDO_CREATE_TABLE.
So for now, we can use this program to replay/debug a sequence of CREATE +
DMLs, but not DROP/RENAME; it is probably enough for a start.
*/
int
main
(
int
argc
,
char
**
argv
)
{
LSN
lsn
;
char
**
default_argv
;
MY_INIT
(
argv
[
0
]);
load_defaults
(
"my"
,
load_default_groups
,
&
argc
,
&
argv
);
default_argv
=
argv
;
get_options
(
&
argc
,
&
argv
);
maria_data_root
=
"."
;
#ifndef DBUG_OFF
#if defined(__WIN__)
default_dbug_option
=
"d:t:i:O,
\\
maria_read_log.trace"
;
#else
default_dbug_option
=
"d:t:i:o,/tmp/maria_read_log.trace"
;
#endif
if
(
argc
>
1
)
{
DBUG_SET
(
default_dbug_option
);
DBUG_SET_INITIAL
(
default_dbug_option
);
}
#endif
if
(
maria_init
())
{
fprintf
(
stderr
,
"Can't init Maria engine (%d)
\n
"
,
errno
);
goto
err
;
}
/* we don't want to create a control file, it MUST exist */
if
(
ma_control_file_create_or_open
(
FALSE
))
{
fprintf
(
stderr
,
"Can't open control file (%d)
\n
"
,
errno
);
goto
err
;
}
if
(
last_logno
==
FILENO_IMPOSSIBLE
)
{
fprintf
(
stderr
,
"Can't find any log
\n
"
);
goto
err
;
}
if
(
init_pagecache
(
&
pagecache
,
PCACHE_SIZE
,
0
,
0
,
TRANSLOG_PAGE_SIZE
)
==
0
)
{
fprintf
(
stderr
,
"Got error in init_pagecache() (errno: %d)
\n
"
,
errno
);
goto
err
;
}
/*
If log handler does not find the "last_logno" log it will return error,
which is good.
But if it finds a log and this log was crashed, it will create a new log,
which is useless. TODO: start log handler in read-only mode.
*/
if
(
translog_init
(
"."
,
LOG_FILE_SIZE
,
50112
,
0
,
&
pagecache
,
TRANSLOG_DEFAULT_FLAGS
))
{
fprintf
(
stderr
,
"Can't init loghandler (%d)
\n
"
,
errno
);
goto
err
;
}
/* install hooks for execution */
#define install_exec_hook(R) \
log_record_type_descriptor[LOGREC_ ## R].record_execute_in_redo_phase= \
exec_LOGREC_ ## R;
install_exec_hook
(
LONG_TRANSACTION_ID
);
#ifdef MARIA_CHECKPOINT
install_exec_hook
(
CHECKPOINT
);
#endif
install_exec_hook
(
REDO_CREATE_TABLE
);
install_exec_hook
(
FILE_ID
);
install_exec_hook
(
REDO_INSERT_ROW_HEAD
);
install_exec_hook
(
COMMIT
);
if
(
opt_only_display
)
printf
(
"You are using --only-display, NOTHING will be written to disk
\n
"
);
lsn
=
first_lsn_in_log
();
/*could also be last_checkpoint_lsn */
TRANSLOG_HEADER_BUFFER
rec
;
struct
st_translog_scanner_data
scanner
;
uint
i
=
1
;
translog_size_t
len
=
translog_read_record_header
(
lsn
,
&
rec
);
if
(
len
==
(
TRANSLOG_RECORD_HEADER_MAX_SIZE
+
1
))
{
printf
(
"EOF on the log
\n
"
);
goto
end
;
}
if
(
translog_init_scanner
(
lsn
,
1
,
&
scanner
))
{
fprintf
(
stderr
,
"Scanner init failed
\n
"
);
goto
err
;
}
for
(;;
i
++
)
{
uint16
sid
=
rec
.
short_trid
;
const
LOG_DESC
*
log_desc
=
&
log_record_type_descriptor
[
rec
.
type
];
display_record_position
(
log_desc
,
&
rec
,
i
);
/*
A complete group is a set of log records with an "end mark" record
(e.g. a set of REDOs for an operation, terminated by an UNDO for this
operation); if there is no "end mark" record the group is incomplete
and won't be executed.
There are pitfalls: if a table write failed, the transaction may have
put an incomplete group in the log and then a COMMIT record, that will
make a complete group which is wrong. We say that we should mark the
table corrupted if such error happens (what if it cannot be marked?).
*/
if
(
log_desc
->
record_ends_group
)
{
if
(
all_active_trans
[
sid
].
group_start_lsn
!=
LSN_IMPOSSIBLE
)
{
/*
There is a complete group for this transaction, containing more than
this event.
*/
printf
(
" ends a group:
\n
"
);
struct
st_translog_scanner_data
scanner2
;
TRANSLOG_HEADER_BUFFER
rec2
;
len
=
translog_read_record_header
(
all_active_trans
[
sid
].
group_start_lsn
,
&
rec2
);
if
(
len
==
(
TRANSLOG_RECORD_HEADER_MAX_SIZE
+
1
))
{
fprintf
(
stderr
,
"Cannot find record where it should be
\n
"
);
goto
err
;
}
if
(
translog_init_scanner
(
rec2
.
lsn
,
1
,
&
scanner2
))
{
fprintf
(
stderr
,
"Scanner2 init failed
\n
"
);
goto
err
;
}
current_group_end_lsn
=
rec
.
lsn
;
do
{
if
(
rec2
.
short_trid
==
sid
)
/* it's in our group */
{
const
LOG_DESC
*
log_desc2
=
&
log_record_type_descriptor
[
rec2
.
type
];
display_record_position
(
log_desc2
,
&
rec2
,
0
);
if
(
display_and_apply_record
(
log_desc2
,
&
rec2
))
goto
err
;
}
len
=
translog_read_next_record_header
(
&
scanner2
,
&
rec2
);
if
(
len
==
(
TRANSLOG_RECORD_HEADER_MAX_SIZE
+
1
))
{
fprintf
(
stderr
,
"Cannot find record where it should be
\n
"
);
goto
err
;
}
}
while
(
rec2
.
lsn
<
rec
.
lsn
);
translog_free_record_header
(
&
rec2
);
/* group finished */
all_active_trans
[
sid
].
group_start_lsn
=
LSN_IMPOSSIBLE
;
current_group_end_lsn
=
LSN_IMPOSSIBLE
;
/* for debugging */
}
if
(
display_and_apply_record
(
log_desc
,
&
rec
))
goto
err
;
}
else
/* record does not end group */
{
/* just record the fact, can't know if can execute yet */
if
(
all_active_trans
[
sid
].
group_start_lsn
==
LSN_IMPOSSIBLE
)
{
/* group not yet started */
all_active_trans
[
sid
].
group_start_lsn
=
rec
.
lsn
;
}
}
len
=
translog_read_next_record_header
(
&
scanner
,
&
rec
);
if
(
len
==
(
TRANSLOG_RECORD_HEADER_MAX_SIZE
+
1
))
{
printf
(
"EOF on the log
\n
"
);
goto
end
;
}
}
translog_free_record_header
(
&
rec
);
/*
So we have applied all REDOs.
We may now have unfinished transactions.
I don't think it's this program's job to roll them back:
to roll back and at the same time stay idempotent, it needs to write log
records (without CLRs, 2nd rollback would hit the effects of first
rollback and fail). But this standalone tool is not allowed to write to
the server's transaction log. So we do not roll back anything.
In the real Recovery code, or the code to do "recover after online
backup", yes we will roll back.
*/
end_of_redo_phase
();
goto
end
;
err:
/* don't touch anything more, in case we hit a bug */
exit
(
1
);
end:
maria_end
();
free_defaults
(
default_argv
);
my_end
(
0
);
exit
(
0
);
return
0
;
/* No compiler warning */
}
static
struct
my_option
my_long_options
[]
=
{
{
"only-display"
,
'o'
,
"display brief info about records's header"
,
(
gptr
*
)
&
opt_only_display
,
(
gptr
*
)
&
opt_only_display
,
0
,
GET_BOOL
,
NO_ARG
,
0
,
0
,
0
,
0
,
0
,
0
},
{
"display-and-apply"
,
'a'
,
"like --only-display but displays more info and modifies tables"
,
(
gptr
*
)
&
opt_display_and_apply
,
(
gptr
*
)
&
opt_display_and_apply
,
0
,
GET_BOOL
,
NO_ARG
,
0
,
0
,
0
,
0
,
0
,
0
},
#ifndef DBUG_OFF
{
"debug"
,
'#'
,
"Output debug log. Often this is 'd:t:o,filename'."
,
0
,
0
,
0
,
GET_STR
,
OPT_ARG
,
0
,
0
,
0
,
0
,
0
,
0
},
#endif
{
0
,
0
,
0
,
0
,
0
,
0
,
GET_NO_ARG
,
NO_ARG
,
0
,
0
,
0
,
0
,
0
,
0
}
};
#include <help_start.h>
static
void
print_version
(
void
)
{
VOID
(
printf
(
"%s Ver 1.0 for %s on %s
\n
"
,
my_progname
,
SYSTEM_TYPE
,
MACHINE_TYPE
));
NETWARE_SET_SCREEN_MODE
(
1
);
}
static
void
usage
(
void
)
{
print_version
();
puts
(
"Copyright (C) 2007 MySQL AB"
);
puts
(
"This software comes with ABSOLUTELY NO WARRANTY. This is free software,"
);
puts
(
"and you are welcome to modify and redistribute it under the GPL license
\n
"
);
puts
(
"Display and apply log records from a MARIA transaction log"
);
puts
(
"found in the current directory (for now)"
);
VOID
(
printf
(
"
\n
Usage: %s OPTIONS
\n
"
,
my_progname
));
puts
(
"You need to use one of -o or -a"
);
my_print_help
(
my_long_options
);
print_defaults
(
"my"
,
load_default_groups
);
my_print_variables
(
my_long_options
);
}
#include <help_end.h>
static
my_bool
get_one_option
(
int
optid
__attribute__
((
unused
)),
const
struct
my_option
*
opt
__attribute__
((
unused
)),
char
*
argument
__attribute__
((
unused
)))
{
/* for now there is nothing special with our options */
return
0
;
}
static
void
get_options
(
int
*
argc
,
char
***
argv
)
{
int
ho_error
;
my_progname
=
argv
[
0
][
0
];
if
((
ho_error
=
handle_options
(
argc
,
argv
,
my_long_options
,
get_one_option
)))
exit
(
ho_error
);
if
((
opt_only_display
+
opt_display_and_apply
)
!=
1
)
{
usage
();
exit
(
1
);
}
}
/* very basic info about the record's header */
static
void
display_record_position
(
const
LOG_DESC
*
log_desc
,
const
TRANSLOG_HEADER_BUFFER
*
rec
,
uint
number
)
{
/*
if number==0, we're going over records which we had already seen and which
form a group, so we indent below the group's end record
*/
printf
(
"%sRec#%u LSN (%lu,0x%lx) short_trid %u %s(num_type:%u) len %lu
\n
"
,
number
?
""
:
" "
,
number
,
(
ulong
)
LSN_FILE_NO
(
rec
->
lsn
),
(
ulong
)
LSN_OFFSET
(
rec
->
lsn
),
rec
->
short_trid
,
log_desc
->
name
,
rec
->
type
,
(
ulong
)
rec
->
record_length
);
}
static
int
display_and_apply_record
(
const
LOG_DESC
*
log_desc
,
const
TRANSLOG_HEADER_BUFFER
*
rec
)
{
int
error
;
if
(
opt_only_display
)
return
0
;
if
(
log_desc
->
record_execute_in_redo_phase
==
NULL
)
{
/* die on all not-yet-handled records :) */
DBUG_ASSERT
(
"one more hook"
==
"to write"
);
}
if
((
error
=
(
*
log_desc
->
record_execute_in_redo_phase
)(
rec
)))
fprintf
(
stderr
,
"Got error when executing record
\n
"
);
return
error
;
}
prototype_exec_hook
(
LONG_TRANSACTION_ID
)
{
uint16
sid
=
rec
->
short_trid
;
TrID
long_trid
=
all_active_trans
[
sid
].
long_trid
;
/* abort group of this trn (must be of before a crash) */
LSN
gslsn
=
all_active_trans
[
sid
].
group_start_lsn
;
char
llbuf
[
22
];
if
(
gslsn
!=
LSN_IMPOSSIBLE
)
{
printf
(
"Group at LSN (%lu,0x%lx) short_trid %u aborted
\n
"
,
(
ulong
)
LSN_FILE_NO
(
gslsn
),
(
ulong
)
LSN_OFFSET
(
gslsn
),
sid
);
all_active_trans
[
sid
].
group_start_lsn
=
LSN_IMPOSSIBLE
;
}
if
(
long_trid
!=
0
)
{
LSN
ulsn
=
all_active_trans
[
sid
].
undo_lsn
;
if
(
ulsn
!=
LSN_IMPOSSIBLE
)
{
llstr
(
long_trid
,
llbuf
);
fprintf
(
stderr
,
"Found an old transaction long_trid %s short_trid %u"
" with same short id as this new transaction, and has neither"
" committed nor rollback (undo_lsn: (%lu,0x%lx))
\n
"
,
llbuf
,
sid
,
(
ulong
)
LSN_FILE_NO
(
ulsn
),
(
ulong
)
LSN_OFFSET
(
ulsn
));
goto
err
;
}
}
long_trid
=
uint6korr
(
rec
->
header
);
all_active_trans
[
sid
].
long_trid
=
long_trid
;
llstr
(
long_trid
,
llbuf
);
printf
(
"Transaction long_trid %s short_trid %u starts
\n
"
,
llbuf
,
sid
);
goto
end
;
err:
DBUG_ASSERT
(
0
);
return
1
;
end:
return
0
;
}
#ifdef MARIA_CHECKPOINT
prototype_exec_hook
(
CHECKPOINT
)
{
/* the only checkpoint we care about was found via control file, ignore */
return
0
;
}
#endif
prototype_exec_hook
(
REDO_CREATE_TABLE
)
{
File
dfile
=
-
1
,
kfile
=
-
1
;
char
*
linkname_ptr
,
filename
[
FN_REFLEN
];
char
*
name
,
*
ptr
;
myf
create_flag
;
uint
flags
;
int
error
,
create_mode
=
O_RDWR
|
O_TRUNC
;
MARIA_HA
*
info
=
NULL
;
if
(((
name
=
my_malloc
(
rec
->
record_length
,
MYF
(
MY_WME
)))
==
NULL
)
||
(
translog_read_record
(
rec
->
lsn
,
0
,
rec
->
record_length
,
name
,
NULL
)
!=
rec
->
record_length
))
{
fprintf
(
stderr
,
"Failed to read record
\n
"
);
goto
err
;
}
printf
(
"Table '%s'"
,
name
);
/* we try hard to get create_rename_lsn, to avoid mistakes if possible */
info
=
maria_open
(
name
,
O_RDONLY
,
HA_OPEN_FOR_REPAIR
);
if
(
info
)
{
DBUG_ASSERT
(
info
->
s
->
reopen
==
1
);
/* check that we're not using it */
if
(
!
info
->
s
->
base
.
transactional
)
{
/*
could be that transactional table was later dropped, and a non-trans
one was renamed to its name, thus create_rename_lsn is 0 and should
not be trusted.
*/
printf
(
", is not transactional
\n
"
);
DBUG_ASSERT
(
0
);
/* I want to know this */
goto
end
;
}
if
(
cmp_translog_addr
(
info
->
s
->
state
.
create_rename_lsn
,
rec
->
lsn
)
>=
0
)
{
printf
(
", has create_rename_lsn (%lu,0x%lx) is more recent than record"
,
(
ulong
)
LSN_FILE_NO
(
rec
->
lsn
),
(
ulong
)
LSN_OFFSET
(
rec
->
lsn
));
goto
end
;
}
if
(
maria_is_crashed
(
info
))
{
printf
(
", is crashed, overwriting it"
);
DBUG_ASSERT
(
0
);
/* I want to know this */
}
maria_close
(
info
);
info
=
NULL
;
}
/* if does not exist, is older, or its header is corrupted, overwrite it */
// TODO symlinks
ptr
=
name
+
strlen
(
name
)
+
1
;
if
((
flags
=
ptr
[
0
]
?
HA_DONT_TOUCH_DATA
:
0
))
printf
(
", we will only touch index file"
);
fn_format
(
filename
,
name
,
""
,
MARIA_NAME_IEXT
,
(
MY_UNPACK_FILENAME
|
(
flags
&
HA_DONT_TOUCH_DATA
)
?
MY_RETURN_REAL_PATH
:
0
)
|
MY_APPEND_EXT
);
linkname_ptr
=
NULL
;
create_flag
=
MY_DELETE_OLD
;
printf
(
", creating as '%s'"
,
filename
);
if
((
kfile
=
my_create_with_symlink
(
linkname_ptr
,
filename
,
0
,
create_mode
,
MYF
(
MY_WME
|
create_flag
)))
<
0
)
{
fprintf
(
stderr
,
"Failed to create index file
\n
"
);
goto
err
;
}
ptr
++
;
uint
kfile_size_before_extension
=
uint2korr
(
ptr
);
ptr
+=
2
;
uint
keystart
=
uint2korr
(
ptr
);
ptr
+=
2
;
/* set create_rename_lsn (for maria_read_log to be idempotent) */
lsn_store
(
ptr
+
sizeof
(
info
->
s
->
state
.
header
)
+
2
,
rec
->
lsn
);
if
(
my_pwrite
(
kfile
,
ptr
,
kfile_size_before_extension
,
0
,
MYF
(
MY_NABP
|
MY_WME
))
||
my_chsize
(
kfile
,
keystart
,
0
,
MYF
(
MY_WME
)))
{
fprintf
(
stderr
,
"Failed to write to index file
\n
"
);
goto
err
;
}
if
(
!
(
flags
&
HA_DONT_TOUCH_DATA
))
{
fn_format
(
filename
,
name
,
""
,
MARIA_NAME_DEXT
,
MY_UNPACK_FILENAME
|
MY_APPEND_EXT
);
linkname_ptr
=
NULL
;
create_flag
=
MY_DELETE_OLD
;
if
((
dfile
=
my_create_with_symlink
(
linkname_ptr
,
filename
,
0
,
create_mode
,
MYF
(
MY_WME
|
create_flag
)))
<
0
)
{
fprintf
(
stderr
,
"Failed to create data file
\n
"
);
goto
err
;
}
/*
we now have an empty data file. To be able to
_ma_initialize_data_file() we need some pieces of the share to be
correctly filled. So we just open the table (fortunately, an empty
data file does not preclude this).
*/
if
(((
info
=
maria_open
(
name
,
O_RDONLY
,
0
))
==
NULL
)
||
_ma_initialize_data_file
(
dfile
,
info
->
s
))
{
fprintf
(
stderr
,
"Failed to open new table or write to data file
\n
"
);
goto
err
;
}
}
error
=
0
;
goto
end
;
err:
DBUG_ASSERT
(
0
);
error
=
1
;
end:
printf
(
"
\n
"
);
if
(
kfile
>=
0
)
error
|=
my_close
(
kfile
,
MYF
(
MY_WME
));
if
(
dfile
>=
0
)
error
|=
my_close
(
dfile
,
MYF
(
MY_WME
));
if
(
info
!=
NULL
)
error
|=
maria_close
(
info
);
my_free
(
name
,
MYF
(
MY_ALLOW_ZERO_PTR
));
return
0
;
}
prototype_exec_hook
(
FILE_ID
)
{
uint16
sid
;
int
error
;
char
*
name
,
*
buff
;
MARIA_HA
*
info
=
NULL
;
if
(((
buff
=
my_malloc
(
rec
->
record_length
,
MYF
(
MY_WME
)))
==
NULL
)
||
(
translog_read_record
(
rec
->
lsn
,
0
,
rec
->
record_length
,
buff
,
NULL
)
!=
rec
->
record_length
))
{
fprintf
(
stderr
,
"Failed to read record
\n
"
);
goto
err
;
}
sid
=
fileid_korr
(
buff
);
name
=
buff
+
FILEID_STORE_SIZE
;
printf
(
"Table '%s', id %u"
,
name
,
sid
);
info
=
all_tables
[
sid
];
if
(
info
!=
NULL
)
{
printf
(
", closing table '%s'"
,
info
->
s
->
open_file_name
);
all_tables
[
sid
]
=
NULL
;
info
->
s
->
base
.
transactional
=
TRUE
;
/* put back the truth */
if
(
maria_close
(
info
))
{
fprintf
(
stderr
,
"Failed to close table
\n
"
);
goto
err
;
}
}
info
=
maria_open
(
name
,
O_RDWR
,
HA_OPEN_FOR_REPAIR
);
if
(
info
==
NULL
)
{
printf
(
", is absent (must have been dropped later?)"
" or its header is so corrupted that we cannot open it;"
" we skip it
\n
"
);
goto
end
;
}
if
(
maria_is_crashed
(
info
))
{
fprintf
(
stderr
,
"Table is crashed, can't apply log records to it
\n
"
);
goto
err
;
}
DBUG_ASSERT
(
info
->
s
->
reopen
==
1
);
/* should always be only one instance */
if
(
!
info
->
s
->
base
.
transactional
)
{
printf
(
", is not transactional
\n
"
);
DBUG_ASSERT
(
0
);
/* I want to know this */
goto
end
;
}
all_tables
[
sid
]
=
info
;
/*
don't log any records for this work. TODO make sure this variable does not
go to disk before we restore it to its true value.
*/
info
->
s
->
base
.
transactional
=
FALSE
;
printf
(
", opened
\n
"
);
error
=
0
;
goto
end
;
err:
DBUG_ASSERT
(
0
);
error
=
1
;
if
(
info
!=
NULL
)
error
|=
maria_close
(
info
);
end:
my_free
(
buff
,
MYF
(
MY_ALLOW_ZERO_PTR
));
return
0
;
}
prototype_exec_hook
(
REDO_INSERT_ROW_HEAD
)
{
uint16
sid
;
ulonglong
page
;
MARIA_HA
*
info
;
char
llbuf
[
22
];
sid
=
fileid_korr
(
rec
->
header
);
page
=
page_korr
(
rec
->
header
+
FILEID_STORE_SIZE
);
llstr
(
page
,
llbuf
);
printf
(
"For page %s of table of short id %u"
,
llbuf
,
sid
);
info
=
all_tables
[
sid
];
if
(
info
==
NULL
)
{
printf
(
", table skipped, so skipping record
\n
"
);
goto
end
;
}
printf
(
", '%s'"
,
info
->
s
->
open_file_name
);
if
(
cmp_translog_addr
(
info
->
s
->
state
.
create_rename_lsn
,
rec
->
lsn
)
>=
0
)
{
printf
(
", has create_rename_lsn (%lu,0x%lx) is more recent than log"
" record
\n
"
,
(
ulong
)
LSN_FILE_NO
(
rec
->
lsn
),
(
ulong
)
LSN_OFFSET
(
rec
->
lsn
));
goto
end
;
}
/*
Soon we will also skip the page depending on the rec_lsn for this page in
the checkpoint record, but this is not absolutely needed for now (just
assume we have made no checkpoint).
*/
printf
(
", applying record
\n
"
);
/*
If REDO's LSN is > page's LSN (read from disk), we are going to modify the
page and change its LSN. The normal runtime code stores the UNDO's LSN
into the page. Here storing the REDO's LSN (rec->lsn) would work
(we are not writing to the log here, so don't have to "flush up to UNDO's
LSN"). But in a test scenario where we do updates at runtime, then remove
tables, apply the log and check that this results in the same table as at
runtime, putting the same LSN as runtime had done will decrease
differences. So we use the UNDO's LSN which is current_group_end_lsn.
*/
DBUG_ASSERT
(
"Monty"
==
"this is the place"
);
end:
/* as we don't have apply working: */
return
1
;
}
prototype_exec_hook
(
COMMIT
)
{
uint16
sid
=
rec
->
short_trid
;
TrID
long_trid
=
all_active_trans
[
sid
].
long_trid
;
LSN
gslsn
=
all_active_trans
[
sid
].
group_start_lsn
;
char
llbuf
[
22
];
if
(
long_trid
==
0
)
{
printf
(
"We don't know about transaction short_trid %u;"
"it probably committed long ago, forget it
\n
"
,
sid
);
return
0
;
}
llstr
(
long_trid
,
llbuf
);
printf
(
"Transaction long_trid %s short_trid %u committed"
,
llbuf
,
sid
);
if
(
gslsn
!=
LSN_IMPOSSIBLE
)
{
/*
It's not an error, it may be that trn got a disk error when writing to a
table, so an unfinished group staid in the log.
*/
printf
(
", with group at LSN (%lu,0x%lx) short_trid %u aborted
\n
"
,
(
ulong
)
LSN_FILE_NO
(
gslsn
),
(
ulong
)
LSN_OFFSET
(
gslsn
),
sid
);
all_active_trans
[
sid
].
group_start_lsn
=
LSN_IMPOSSIBLE
;
}
else
printf
(
"
\n
"
);
all_active_trans
[
sid
].
long_trid
=
0
;
#ifdef MARIA_VERSIONING
/*
if real recovery:
transaction was committed, move it to some separate list for later
purging (but don't purge now! purging may have been started before, we
may find REDO_PURGE records soon).
*/
#endif
return
0
;
}
/* Just to inform about any aborted groups or unfinished transactions */
static
void
end_of_redo_phase
()
{
uint
sid
,
unfinished
=
0
;
for
(
sid
=
0
;
sid
<=
SHORT_TRID_MAX
;
sid
++
)
{
TrID
long_trid
=
all_active_trans
[
sid
].
long_trid
;
LSN
gslsn
=
all_active_trans
[
sid
].
group_start_lsn
;
if
(
long_trid
==
0
)
continue
;
if
(
all_active_trans
[
sid
].
undo_lsn
!=
LSN_IMPOSSIBLE
)
{
char
llbuf
[
22
];
llstr
(
long_trid
,
llbuf
);
printf
(
"Transaction long_trid %s short_trid %u unfinished
\n
"
,
llbuf
,
sid
);
}
if
(
gslsn
!=
LSN_IMPOSSIBLE
)
{
printf
(
"Group at LSN (%lu,0x%lx) short_trid %u aborted
\n
"
,
(
ulong
)
LSN_FILE_NO
(
gslsn
),
(
ulong
)
LSN_OFFSET
(
gslsn
),
sid
);
}
/* If real recovery: roll back unfinished transaction */
#ifdef MARIA_VERSIONING
/*
If real recovery: transaction was committed, move it to some separate
list for soon purging.
*/
#endif
}
/*
We don't close tables if there are some unfinished transactions, because
closing tables normally requires that all unfinished transactions on them
be rolled back.
For example, closing will soon write the state to disk and when doing that
it will think this is a committed state, but it may not be.
*/
if
(
unfinished
==
0
)
{
for
(
sid
=
0
;
sid
<=
SHORT_TRID_MAX
;
sid
++
)
{
MARIA_HA
*
info
=
all_tables
[
sid
];
if
(
info
!=
NULL
)
maria_close
(
info
);
}
}
}
storage/maria/trnman_public.h
View file @
ff3e4bd9
...
...
@@ -20,6 +20,9 @@
to include my_atomic.h in C++ code.
*/
#ifndef _trnman_public_h
#define _trnman_public_h
#include "ma_loghandler_lsn.h"
C_MODE_START
...
...
@@ -52,3 +55,4 @@ my_bool trnman_has_locked_tables(TRN *trn);
void
trnman_reset_locked_tables
(
TRN
*
trn
);
C_MODE_END
#endif
storage/maria/unittest/ma_control_file-t.c
View file @
ff3e4bd9
...
...
@@ -121,8 +121,8 @@ static int delete_file(myf my_flags)
The error will however be printed on stderr.
*/
my_delete
(
file_name
,
my_flags
);
expect_checkpoint_lsn
=
CONTROL_FILE_IMPOSSIBLE_LSN
;
expect_logno
=
CONTROL_FILE_IMPOSSIBLE_FILENO
;
expect_checkpoint_lsn
=
LSN_IMPOSSIBLE
;
expect_logno
=
FILENO_IMPOSSIBLE
;
return
0
;
}
...
...
@@ -146,9 +146,9 @@ static int verify_module_values_match_expected()
*/
static
int
verify_module_values_are_impossible
()
{
RET_ERR_UNLESS
(
last_logno
==
CONTROL_FILE_IMPOSSIBLE_FILENO
);
RET_ERR_UNLESS
(
last_logno
==
FILENO_IMPOSSIBLE
);
RET_ERR_UNLESS
(
last_checkpoint_lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
);
LSN_IMPOSSIBLE
);
return
0
;
}
...
...
@@ -164,7 +164,7 @@ static int close_file()
static
int
create_or_open_file
()
{
RET_ERR_UNLESS
(
ma_control_file_create_or_open
()
==
CONTROL_FILE_OK
);
RET_ERR_UNLESS
(
ma_control_file_create_or_open
(
TRUE
)
==
CONTROL_FILE_OK
);
/* Check that the module reports expected information */
RET_ERR_UNLESS
(
verify_module_values_match_expected
()
==
0
);
return
0
;
...
...
@@ -188,7 +188,7 @@ static int test_one_log()
RET_ERR_UNLESS
(
create_or_open_file
()
==
CONTROL_FILE_OK
);
objs_to_write
=
CONTROL_FILE_UPDATE_ONLY_LOGNO
;
expect_logno
=
123
;
RET_ERR_UNLESS
(
write_file
(
CONTROL_FILE_IMPOSSIBLE_LSN
,
RET_ERR_UNLESS
(
write_file
(
LSN_IMPOSSIBLE
,
expect_logno
,
objs_to_write
)
==
0
);
RET_ERR_UNLESS
(
close_file
()
==
0
);
...
...
@@ -206,7 +206,7 @@ static int test_five_logs()
for
(
i
=
0
;
i
<
5
;
i
++
)
{
expect_logno
*=
3
;
RET_ERR_UNLESS
(
write_file
(
CONTROL_FILE_IMPOSSIBLE_LSN
,
expect_logno
,
RET_ERR_UNLESS
(
write_file
(
LSN_IMPOSSIBLE
,
expect_logno
,
objs_to_write
)
==
0
);
}
RET_ERR_UNLESS
(
close_file
()
==
0
);
...
...
@@ -320,7 +320,7 @@ static int test_bad_magic_string()
RET_ERR_UNLESS
(
my_pwrite
(
fd
,
"papa"
,
4
,
0
,
MYF
(
MY_FNABP
|
MY_WME
))
==
0
);
/* Check that control file module sees the problem */
RET_ERR_UNLESS
(
ma_control_file_create_or_open
()
==
RET_ERR_UNLESS
(
ma_control_file_create_or_open
(
TRUE
)
==
CONTROL_FILE_BAD_MAGIC_STRING
);
/* Restore magic string */
RET_ERR_UNLESS
(
my_pwrite
(
fd
,
buffer
,
4
,
0
,
MYF
(
MY_FNABP
|
MY_WME
))
==
0
);
...
...
@@ -346,7 +346,7 @@ static int test_bad_checksum()
buffer
[
0
]
+=
3
;
/* mangle checksum */
RET_ERR_UNLESS
(
my_pwrite
(
fd
,
buffer
,
1
,
8
,
MYF
(
MY_FNABP
|
MY_WME
))
==
0
);
/* Check that control file module sees the problem */
RET_ERR_UNLESS
(
ma_control_file_create_or_open
()
==
RET_ERR_UNLESS
(
ma_control_file_create_or_open
(
TRUE
)
==
CONTROL_FILE_BAD_CHECKSUM
);
/* Restore checksum */
buffer
[
0
]
-=
3
;
...
...
@@ -369,10 +369,11 @@ static int test_bad_size()
MYF
(
MY_WME
)))
>=
0
);
RET_ERR_UNLESS
(
my_write
(
fd
,
buffer
,
10
,
MYF
(
MY_FNABP
|
MY_WME
))
==
0
);
/* Check that control file module sees the problem */
RET_ERR_UNLESS
(
ma_control_file_create_or_open
()
==
CONTROL_FILE_TOO_SMALL
);
RET_ERR_UNLESS
(
ma_control_file_create_or_open
(
TRUE
)
==
CONTROL_FILE_TOO_SMALL
);
RET_ERR_UNLESS
(
my_write
(
fd
,
buffer
,
30
,
MYF
(
MY_FNABP
|
MY_WME
))
==
0
);
/* Check that control file module sees the problem */
RET_ERR_UNLESS
(
ma_control_file_create_or_open
()
==
CONTROL_FILE_TOO_BIG
);
RET_ERR_UNLESS
(
ma_control_file_create_or_open
(
TRUE
)
==
CONTROL_FILE_TOO_BIG
);
RET_ERR_UNLESS
(
my_close
(
fd
,
MYF
(
MY_WME
))
==
0
);
/* Leave a correct control file */
...
...
storage/maria/unittest/ma_test_loghandler-t.c
View file @
ff3e4bd9
...
...
@@ -164,7 +164,7 @@ int main(int argc __attribute__((unused)), char *argv[])
}
#endif
if
(
ma_control_file_create_or_open
())
if
(
ma_control_file_create_or_open
(
TRUE
))
{
fprintf
(
stderr
,
"Can't init control file (%d)
\n
"
,
errno
);
exit
(
1
);
...
...
@@ -336,7 +336,7 @@ int main(int argc __attribute__((unused)), char *argv[])
ma_control_file_end
();
if
(
ma_control_file_create_or_open
())
if
(
ma_control_file_create_or_open
(
TRUE
))
{
fprintf
(
stderr
,
"pass2: Can't init control file (%d)
\n
"
,
errno
);
exit
(
1
);
...
...
@@ -398,7 +398,7 @@ int main(int argc __attribute__((unused)), char *argv[])
i
,
errno
);
goto
err
;
}
if
(
rec
.
lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
rec
.
lsn
==
LSN_IMPOSSIBLE
)
{
if
(
i
!=
ITERATIONS
)
{
...
...
@@ -477,7 +477,7 @@ int main(int argc __attribute__((unused)), char *argv[])
"failed (%d)
\n
"
,
i
,
errno
);
goto
err
;
}
if
(
rec
.
lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
rec
.
lsn
==
LSN_IMPOSSIBLE
)
{
fprintf
(
stderr
,
"EOL met at the middle of iteration (first var) %u "
"instead of beginning of %u
\n
"
,
i
,
ITERATIONS
);
...
...
@@ -572,7 +572,7 @@ int main(int argc __attribute__((unused)), char *argv[])
i
,
errno
);
goto
err
;
}
if
(
rec
.
lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
rec
.
lsn
==
LSN_IMPOSSIBLE
)
{
fprintf
(
stderr
,
"EOL met at the middle of iteration %u "
"instead of beginning of %u
\n
"
,
i
,
ITERATIONS
);
...
...
storage/maria/unittest/ma_test_loghandler_multigroup-t.c
View file @
ff3e4bd9
...
...
@@ -161,7 +161,7 @@ int main(int argc __attribute__((unused)), char *argv[])
}
#endif
if
(
ma_control_file_create_or_open
())
if
(
ma_control_file_create_or_open
(
TRUE
))
{
fprintf
(
stderr
,
"Can't init control file (%d)
\n
"
,
errno
);
exit
(
1
);
...
...
@@ -325,7 +325,7 @@ int main(int argc __attribute__((unused)), char *argv[])
end_pagecache
(
&
pagecache
,
1
);
ma_control_file_end
();
if
(
ma_control_file_create_or_open
())
if
(
ma_control_file_create_or_open
(
TRUE
))
{
fprintf
(
stderr
,
"pass2: Can't init control file (%d)
\n
"
,
errno
);
exit
(
1
);
...
...
@@ -390,7 +390,7 @@ int main(int argc __attribute__((unused)), char *argv[])
translog_free_record_header
(
&
rec
);
goto
err
;
}
if
(
rec
.
lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
rec
.
lsn
==
LSN_IMPOSSIBLE
)
{
if
(
i
!=
ITERATIONS
)
{
...
...
@@ -470,7 +470,7 @@ int main(int argc __attribute__((unused)), char *argv[])
"failed (%d)
\n
"
,
i
,
errno
);
goto
err
;
}
if
(
rec
.
lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
rec
.
lsn
==
LSN_IMPOSSIBLE
)
{
fprintf
(
stderr
,
"EOL met at the middle of iteration (first var) %u "
"instead of beginning of %u
\n
"
,
i
,
ITERATIONS
);
...
...
@@ -568,7 +568,7 @@ int main(int argc __attribute__((unused)), char *argv[])
translog_free_record_header
(
&
rec
);
goto
err
;
}
if
(
rec
.
lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
rec
.
lsn
==
LSN_IMPOSSIBLE
)
{
fprintf
(
stderr
,
"EOL met at the middle of iteration %u "
"instead of beginning of %u
\n
"
,
i
,
ITERATIONS
);
...
...
storage/maria/unittest/ma_test_loghandler_multithread-t.c
View file @
ff3e4bd9
...
...
@@ -270,7 +270,7 @@ int main(int argc __attribute__((unused)),
my_thread_global_init
();
if
(
ma_control_file_create_or_open
())
if
(
ma_control_file_create_or_open
(
TRUE
))
{
fprintf
(
stderr
,
"Can't init control file (%d)
\n
"
,
errno
);
exit
(
1
);
...
...
@@ -384,7 +384,7 @@ int main(int argc __attribute__((unused)),
translog_free_record_header
(
&
rec
);
goto
err
;
}
if
(
rec
.
lsn
==
CONTROL_FILE_IMPOSSIBLE_LSN
)
if
(
rec
.
lsn
==
LSN_IMPOSSIBLE
)
{
if
(
i
!=
WRITERS
*
ITERATIONS
*
2
)
{
...
...
storage/maria/unittest/ma_test_loghandler_pagecache-t.c
View file @
ff3e4bd9
...
...
@@ -56,7 +56,7 @@ int main(int argc __attribute__((unused)), char *argv[])
}
#endif
if
(
ma_control_file_create_or_open
())
if
(
ma_control_file_create_or_open
(
TRUE
))
{
fprintf
(
stderr
,
"Can't init control file (%d)
\n
"
,
errno
);
exit
(
1
);
...
...
storage/myisam/mi_close.c
View file @
ff3e4bd9
...
...
@@ -75,6 +75,7 @@ int mi_close(register MI_INFO *info)
not change the crashed state.
We can NOT write the state in other cases as other threads
may be using the file at this point
IF using --external-locking.
*/
if
(
share
->
mode
!=
O_RDONLY
&&
mi_is_crashed
(
info
))
mi_state_info_write
(
share
->
kfile
,
&
share
->
state
,
1
);
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment