1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
|
/*****************************************************************************
Copyright (c) 2013, 2016, Oracle and/or its affiliates. All Rights Reserved.
Copyright (c) 2017, 2019, MariaDB Corporation.
This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
Foundation; version 2 of the License.
This program is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
You should have received a copy of the GNU General Public License along with
this program; if not, write to the Free Software Foundation, Inc.,
51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA
*****************************************************************************/
/**************************************************//**
@file fsp/fsp0file.cc
Tablespace data file implementation
Created 2013-7-26 by Kevin Lewis
*******************************************************/
#include "fil0fil.h"
#include "fsp0types.h"
#include "os0file.h"
#include "page0page.h"
#include "srv0start.h"
/** Give a not-yet-named datafile its tablespace name and flags.
The name string is duplicated, so the caller keeps ownership of its buffer.
@param[in]	name	tablespace name, must not be NULL; will be copied
@param[in]	flags	tablespace flags */
void
Datafile::init(
	const char*	name,
	ulint		flags)
{
	ut_ad(m_name == NULL);
	ut_ad(name != NULL);

	m_flags = flags;
	m_name = mem_strdup(name);
}
/** Release everything this datafile holds: close the file handle if it is
open, then free the name, the filepath and the cached first page. */
void
Datafile::shutdown()
{
	close();

	/* The name is freed unconditionally and the pointer is reset. */
	ut_free(m_name);
	m_name = NULL;

	free_filepath();

	free_first_page();
}
/** Create or open the data file named by m_filepath, using the open flags
currently stored in m_open_flags. The file must not be open yet.
@param[in]	read_only_mode	if true, then readonly mode checks are enforced
@retval DB_SUCCESS		if the file handle was obtained
@retval DB_CANNOT_OPEN_FILE	if the OS call failed; the OS error is kept
				in m_last_os_error */
dberr_t
Datafile::open_or_create(bool read_only_mode)
{
	ut_a(m_filepath != NULL);
	ut_ad(m_handle == OS_FILE_CLOSED);

	bool	opened;

	m_handle = os_file_create(
		innodb_data_file_key, m_filepath, m_open_flags,
		OS_FILE_NORMAL, OS_DATA_FILE, read_only_mode, &opened);

	if (opened) {
		return(DB_SUCCESS);
	}

	m_last_os_error = os_file_get_last_error(true);

	ib::error() << "Cannot open datafile '" << m_filepath << "'";

	return(DB_CANNOT_OPEN_FILE);
}
/** Open the data file read-only, to find out whether it exists so that it
can be validated. On success the file is marked as existing and its OS file
info is recorded.
@param[in]	strict	whether to issue error messages
@retval DB_SUCCESS		if the file was opened
@retval DB_ERROR		if no filepath has been set
@retval DB_CANNOT_OPEN_FILE	if the file could not be opened */
dberr_t
Datafile::open_read_only(bool strict)
{
	ut_ad(m_handle == OS_FILE_CLOSED);

	/* Some file objects never need to be opened; those have no
	filepath at all. */
	if (m_filepath == NULL) {
		return(DB_ERROR);
	}

	bool	opened = false;

	set_open_flags(OS_FILE_OPEN);

	m_handle = os_file_create_simple_no_error_handling(
		innodb_data_file_key, m_filepath, m_open_flags,
		OS_FILE_READ_ONLY, true, &opened);

	if (!opened) {
		/* The OS error is fetched and reported only when the
		caller asked for messages. */
		if (strict) {
			m_last_os_error = os_file_get_last_error(true);

			ib::error() << "Cannot open datafile for read-only: '"
				<< m_filepath << "' OS error: "
				<< m_last_os_error;
		}

		return(DB_CANNOT_OPEN_FILE);
	}

	m_exists = true;
	init_file_info();

	return(DB_SUCCESS);
}
/** Open the data file for reading and writing during start-up, so that
doublewrite pages can be restored before the file is validated. On success
the file is marked as existing and its OS file info is recorded.
@param[in]	read_only_mode	if true, then readonly mode checks are enforced
@retval DB_SUCCESS		if the file was opened
@retval DB_ERROR		if no filepath has been set
@retval DB_CANNOT_OPEN_FILE	if the file could not be opened; the OS error
				is kept in m_last_os_error */
dberr_t
Datafile::open_read_write(bool read_only_mode)
{
	ut_ad(m_handle == OS_FILE_CLOSED);

	/* Some file objects never need to be opened; those have no
	filepath at all. */
	if (m_filepath == NULL) {
		return(DB_ERROR);
	}

	bool	opened = false;

	set_open_flags(OS_FILE_OPEN);

	m_handle = os_file_create_simple_no_error_handling(
		innodb_data_file_key, m_filepath, m_open_flags,
		OS_FILE_READ_WRITE, read_only_mode, &opened);

	if (opened) {
		m_exists = true;
		init_file_info();

		return(DB_SUCCESS);
	}

	m_last_os_error = os_file_get_last_error(true);

	ib::error() << "Cannot open datafile for read-write: '"
		<< m_filepath << "'";

	return(DB_CANNOT_OPEN_FILE);
}
/** Fill m_file_info with the operating system's description of the open
file handle. same_as() compares this information between two datafiles.
The result of the OS call is not checked here. */
void
Datafile::init_file_info()
{
#ifndef _WIN32
	fstat(m_handle, &m_file_info);
#else
	GetFileInformationByHandle(m_handle, &m_file_info);
#endif /* !_WIN32 */
}
/** Close the data file if it is open. Calling this on an already closed
datafile does nothing. A failure to close the handle is treated as fatal.
@return DB_SUCCESS always */
dberr_t
Datafile::close()
{
	if (m_handle == OS_FILE_CLOSED) {
		return(DB_SUCCESS);
	}

	ibool	closed = os_file_close(m_handle);
	ut_a(closed);

	m_handle = OS_FILE_CLOSED;

	return(DB_SUCCESS);
}
/** Build a full filepath from a directory path, a filename and an extension
and store it in m_filepath, replacing any previous filepath. The path is
assembled by fil_make_filepath(). If dirpath is NULL, the default datadir
is prepended to the filename. m_filename is refreshed afterwards.
@param[in]	dirpath		directory path, or NULL
@param[in]	filename	filename or filepath, or NULL if dirpath is given
@param[in]	ext		filename extension */
void
Datafile::make_filepath(
	const char*	dirpath,
	const char*	filename,
	ib_extention	ext)
{
	ut_ad(dirpath != NULL || filename != NULL);

	/* Drop the old path before building the new one. */
	free_filepath();

	char*	new_path = fil_make_filepath(dirpath, filename, ext, false);

	m_filepath = new_path;
	ut_ad(m_filepath != NULL);

	set_filename();
}
/** Replace m_filepath with a private copy of the given filepath, which is
the name of the file with its extension and an absolute or relative path.
m_filename is refreshed afterwards.
@param[in]	filepath	filepath to copy; must not be NULL */
void
Datafile::set_filepath(const char* filepath)
{
	free_filepath();

	/* Room for the characters plus the terminating NUL. */
	const size_t	n_bytes = strlen(filepath) + 1;
	char*		copy = static_cast<char*>(ut_malloc_nokey(n_bytes));

	::strcpy(copy, filepath);
	m_filepath = copy;

	set_filename();
}
/** Free the filepath buffer, if there is one, and reset both m_filepath
and m_filename. Nothing is touched when no filepath is set. */
void
Datafile::free_filepath()
{
	if (m_filepath == NULL) {
		return;
	}

	ut_free(m_filepath);

	m_filename = NULL;
	m_filepath = NULL;
}
/** Quick byte-by-byte comparison of this datafile's filepath with another
filepath. Two different-looking paths may still name the same file; that
case is detected with same_as() once the files are open.
@param[in]	other	filepath to compare with
@retval true	if the two strings are identical
@retval false	if they differ */
bool
Datafile::same_filepath_as(
	const char*	other) const
{
	const int	diff = strcmp(m_filepath, other);

	return(diff == 0);
}
/** Test whether another datafile refers to the same underlying file as this
one, by comparing the OS file information stored in m_file_info of both
objects (filled in by init_file_info() when a file is opened).
@param[in]	other	Datafile to compare with
@return true if it is the same file, else false */
bool
Datafile::same_as(
	const Datafile&	other) const
{
#ifdef _WIN32
	/* Same volume and same 64-bit file index means same file. */
	if (m_file_info.dwVolumeSerialNumber
	    != other.m_file_info.dwVolumeSerialNumber) {
		return(false);
	}

	if (m_file_info.nFileIndexHigh
	    != other.m_file_info.nFileIndexHigh) {
		return(false);
	}

	return(m_file_info.nFileIndexLow
	       == other.m_file_info.nFileIndexLow);
#else
	/* Same inode on the same device means same file. */
	if (m_file_info.st_ino != other.m_file_info.st_ino) {
		return(false);
	}

	return(m_file_info.st_dev == other.m_file_info.st_dev);
#endif /* _WIN32 */
}
/** Replace m_name with a newly allocated datafile or tablespace name.
When a name is supplied it is duplicated; otherwise a file-per-table
tablespace name is derived from m_filepath. The previous name is freed
first. shutdown() releases the name again.
@param[in]	name	tablespace name if known, NULL if not */
void
Datafile::set_name(const char* name)
{
	ut_free(m_name);

	m_name = (name == NULL)
		? fil_path_to_space_name(m_filepath)
		: mem_strdup(name);
}
/** Read the first page of this datafile into a newly allocated, aligned
buffer. For the first file of a tablespace (m_order == 0) the space ID and
the tablespace flags are taken from the page header. The file is opened with
open_or_create() first if it is not open yet. A first page cached by an
earlier call is released before the new buffer is allocated.
If the read fails, the buffer stays allocated until free_first_page().
@param[in]	read_only_mode	if true, then readonly mode checks are enforced
@retval DB_SUCCESS	if the page was read and its flags are usable
@retval DB_CORRUPTION	if the flags are invalid, or fewer bytes could be
			read than the physical page size the flags imply
@return otherwise the error from open_or_create() or from the read */
dberr_t
Datafile::read_first_page(bool read_only_mode)
{
	if (m_handle == OS_FILE_CLOSED) {

		dberr_t	err = open_or_create(read_only_mode);

		if (err != DB_SUCCESS) {
			return(err);
		}
	}

	/* Release a buffer left over from an earlier call. Without this
	the old allocation would be leaked when m_first_page_buf is
	overwritten below. */
	free_first_page();

	m_first_page_buf = static_cast<byte*>(
		ut_malloc_nokey(2 * UNIV_PAGE_SIZE_MAX));

	/* Align the memory for a possible read from a raw device */

	m_first_page = static_cast<byte*>(
		ut_align(m_first_page_buf, srv_page_size));

	IORequest	request;
	dberr_t		err = DB_ERROR;
	size_t		page_size = UNIV_PAGE_SIZE_MAX;

	/* Don't want unnecessary complaints about partial reads. */

	request.disable_partial_io_warnings();

	/* Start with the largest page size and halve the request each time
	the file turns out to be shorter than what was asked for. */
	while (page_size >= UNIV_PAGE_SIZE_MIN) {

		ulint	n_read = 0;

		err = os_file_read_no_error_handling(
			request, m_handle, m_first_page, 0, page_size, &n_read);

		if (err == DB_IO_ERROR && n_read >= UNIV_PAGE_SIZE_MIN) {

			/* Short read, but at least a minimum-size page
			is there: retry with half the size. */
			page_size >>= 1;

		} else if (err == DB_SUCCESS) {

			ut_a(n_read == page_size);

			break;

		} else if (srv_operation == SRV_OPERATION_BACKUP) {
			/* During backup the failure is not reported. */
			break;
		} else {

			ib::error()
				<< "Cannot read first page of '"
				<< m_filepath << "' "
				<< ut_strerr(err);

			break;
		}
	}

	if (err != DB_SUCCESS) {
		return(err);
	}

	if (m_order == 0) {
		m_space_id = fsp_header_get_space_id(m_first_page);
		m_flags = fsp_header_get_flags(m_first_page);

		if (!fil_space_t::is_valid_flags(m_flags, m_space_id)) {
			/* Try to interpret the flags in the format that
			fsp_flags_convert_from_101() understands. */
			ulint	cflags = fsp_flags_convert_from_101(m_flags);

			if (cflags == ULINT_UNDEFINED) {
				ib::error()
					<< "Invalid flags " << ib::hex(m_flags)
					<< " in " << m_filepath;
				return(DB_CORRUPTION);
			} else {
				m_flags = cflags;
			}
		}
	}

	/* The amount that could be read must cover one physical page. */
	const size_t	physical_size = fil_space_t::physical_size(m_flags);

	if (physical_size > page_size) {
		ib::error() << "File " << m_filepath
			<< " should be longer than "
			<< page_size << " bytes";
		return(DB_CORRUPTION);
	}

	return(err);
}
/** Free the cached first page when it is no longer needed and reset both
the buffer pointer and the aligned page pointer. Does nothing when no
buffer is allocated. */
void
Datafile::free_first_page()
{
	if (!m_first_page_buf) {
		return;
	}

	ut_free(m_first_page_buf);

	m_first_page = NULL;
	m_first_page_buf = NULL;
}
/** Validate the datafile against the space ID and flags that the data
dictionary expects. The file must exist and be open. The first page is
checked with validate_first_page(); then the space ID and the flags (with
the FSP_FLAGS_MEM_MASK bits removed from the expected value) are compared.
@param[in]	space_id	The expected tablespace ID.
@param[in]	flags		The expected tablespace flags.
@retval DB_SUCCESS	if the datafile matches the expected tablespace
@retval DB_ERROR	if the file is not open or does not match; on a
			mismatch m_is_valid is set to false
@return otherwise the error returned by validate_first_page() */
dberr_t
Datafile::validate_to_dd(ulint space_id, ulint flags)
{
	if (!is_open()) {
		return DB_ERROR;
	}

	/* Validate this single-table-tablespace with the data dictionary,
	but do not compare the DATA_DIR flag, in case the tablespace was
	remotely located. */
	const dberr_t	first_page_err = validate_first_page(0);

	if (first_page_err != DB_SUCCESS) {
		return(first_page_err);
	}

	flags &= ~FSP_FLAGS_MEM_MASK;

	/* The datafile must carry the expected space ID. For a
	file-per-table tablespace the row format and zip page size must
	match as well; the flags are compared in both directions. */
	const bool	matches = m_space_id == space_id
		&& (fil_space_t::is_flags_equal(flags, m_flags)
		    || fil_space_t::is_flags_equal(m_flags, flags));

	if (matches) {
		return(DB_SUCCESS);
	}

	/* Do not use this tablespace. */
	m_is_valid = false;

	ib::error() << "Refusing to load '" << m_filepath << "' (id="
		<< m_space_id << ", flags=" << ib::hex(m_flags)
		<< "); dictionary contains id="
		<< space_id << ", flags=" << ib::hex(flags);

	return(DB_ERROR);
}
/** Validate this datafile for the purpose of recovery. The file must exist
and be open. It is initially open in read-only mode because only the space
ID needs to be read. If the first page does not validate, the file is
reopened in read-write mode, the space ID is determined from a survey of the
first pages, and we try to restore page 0 from the doublewrite buffer before
validating again. On success the name is derived from the filepath.
@retval DB_SUCCESS		if the tablespace is valid
@retval DB_TABLESPACE_EXISTS	if validate_first_page() reported a duplicate
				space ID
@retval DB_CORRUPTION		if no usable space ID could be determined or
				page 0 could not be restored
@return otherwise the error from reopening or re-validating the file */
dberr_t
Datafile::validate_for_recovery()
{
	dberr_t err;

	ut_ad(is_open());
	ut_ad(!srv_read_only_mode);

	err = validate_first_page(0);

	switch (err) {
	case DB_SUCCESS:
	case DB_TABLESPACE_EXISTS:
		break;

	default:
		/* Re-open the file in read-write mode. Attempt to restore
		page 0 from doublewrite and read the space ID from a survey
		of the first few pages. */
		close();
		err = open_read_write(srv_read_only_mode);
		if (err != DB_SUCCESS) {
			return(err);
		}

		err = find_space_id();
		if (err != DB_SUCCESS || m_space_id == 0) {
			ib::error() << "Datafile '" << m_filepath << "' is"
				" corrupted. Cannot determine the space ID from"
				" the first 64 pages.";
			/* This is a failure path: never hand DB_SUCCESS
			back to the caller when only the space ID check
			tripped. */
			return(err != DB_SUCCESS ? err : DB_CORRUPTION);
		}

		if (restore_from_doublewrite()) {
			return(DB_CORRUPTION);
		}

		/* Free the previously read first page and then re-validate. */
		free_first_page();
		err = validate_first_page(0);
	}

	if (err == DB_SUCCESS) {
		/* Derive the tablespace name from the filepath. */
		set_name(NULL);
	}

	return(err);
}
/** Check the consistency of the first page of a datafile when the
tablespace is opened. This occurs before the fil_space_t is created
so the Space ID found here must not already be open.
The first page is read with read_first_page() unless it is already cached.
m_is_valid is set to true on entry and reset to false on the DB_CORRUPTION
and DB_TABLESPACE_EXISTS paths; it is not reset on the page size mismatch
(DB_ERROR) path.
@param[out] flush_lsn contents of FIL_PAGE_FILE_FLUSH_LSN, or NULL if the
caller does not need it
@retval DB_SUCCESS on if the datafile is valid
@retval DB_CORRUPTION if the datafile is not readable or fails a check, or
if a predefined tablespace has a duplicate space_id
@retval DB_ERROR if the page size in the flags differs from srv_page_size
@retval DB_TABLESPACE_EXISTS if there is a duplicate space_id */
dberr_t
Datafile::validate_first_page(lsn_t* flush_lsn)
{
char* prev_name;
char* prev_filepath;
const char* error_txt = NULL;
m_is_valid = true;
/* Only read the page from the file if no copy is cached yet. */
if (m_first_page == NULL
&& read_first_page(srv_read_only_mode) != DB_SUCCESS) {
error_txt = "Cannot read first page";
} else {
ut_ad(m_first_page_buf);
ut_ad(m_first_page);
if (flush_lsn != NULL) {
*flush_lsn = mach_read_from_8(
m_first_page + FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION);
}
}
if (error_txt != NULL) {
/* Common failure exit: every later check that sets error_txt jumps
back to this label. The message is logged at info level, the cached
page is dropped and DB_CORRUPTION is returned. */
err_exit:
ib::info() << error_txt << " in datafile: " << m_filepath
<< ", Space ID:" << m_space_id << ", Flags: "
<< m_flags;
m_is_valid = false;
free_first_page();
return(DB_CORRUPTION);
}
/* Check if the whole page is blank. The scan is only done when both
the space ID and the flags are zero. */
if (!m_space_id && !m_flags) {
const byte* b = m_first_page;
ulint nonzero_bytes = srv_page_size;
/* The counter reaches zero only if all srv_page_size bytes
are zero. */
while (*b == '\0' && --nonzero_bytes != 0) {
b++;
}
if (nonzero_bytes == 0) {
error_txt = "Header page consists of zero bytes";
goto err_exit;
}
}
if (!fil_space_t::is_valid_flags(m_flags, m_space_id)) {
/* Tablespace flags must be valid. */
error_txt = "Tablespace flags are invalid";
goto err_exit;
}
ulint logical_size = fil_space_t::logical_size(m_flags);
if (srv_page_size != logical_size) {
/* Logical size must be innodb_page_size. This path reports its own
error and returns DB_ERROR instead of going through err_exit. */
ib::error()
<< "Data file '" << m_filepath << "' uses page size "
<< logical_size << ", but the innodb_page_size"
" start-up parameter is "
<< srv_page_size;
free_first_page();
return(DB_ERROR);
}
if (page_get_page_no(m_first_page) != 0) {
/* First page must be number 0 */
error_txt = "Header page contains inconsistent data";
goto err_exit;
}
/* Space IDs at or above SRV_LOG_SPACE_FIRST_ID are rejected. */
if (m_space_id >= SRV_LOG_SPACE_FIRST_ID) {
error_txt = "A bad Space ID was found";
goto err_exit;
}
if (buf_page_is_corrupted(false, m_first_page, m_flags)) {
/* Look for checksum and other corruptions. */
error_txt = "Checksum mismatch";
goto err_exit;
}
/* Look up whether a tablespace with this space ID is already known.
On success the two returned strings are freed here. */
if (fil_space_read_name_and_filepath(
m_space_id, &prev_name, &prev_filepath)) {
/* The same space ID at the same filepath is this very file. */
if (0 == strcmp(m_filepath, prev_filepath)) {
ut_free(prev_name);
ut_free(prev_filepath);
return(DB_SUCCESS);
}
/* Make sure the space_id has not already been opened. */
ib::error() << "Attempted to open a previously opened"
" tablespace. Previous tablespace " << prev_name
<< " at filepath: " << prev_filepath
<< " uses space ID: " << m_space_id
<< ". Cannot open filepath: " << m_filepath
<< " which uses the same space ID.";
ut_free(prev_name);
ut_free(prev_filepath);
m_is_valid = false;
free_first_page();
/* A duplicate of a predefined tablespace is reported as corruption. */
return(is_predefined_tablespace(m_space_id)
? DB_CORRUPTION
: DB_TABLESPACE_EXISTS);
}
return(DB_SUCCESS);
}
/** Determine the space id of the given file descriptor by reading a few
pages from the beginning of the .ibd file. Each candidate page size from
UNIV_ZIP_SIZE_MIN up to UNIV_PAGE_SIZE_MAX is tried in turn; for each one,
up to 64 pages are read and the space IDs of the pages that pass the
corruption check are counted. On success the chosen ID is stored in
m_space_id.
@retval DB_SUCCESS if a space id was successfully identified
@retval DB_CORRUPTION if the file size cannot be determined or no space id
could be agreed on */
dberr_t
Datafile::find_space_id()
{
os_offset_t file_size;
ut_ad(m_handle != OS_FILE_CLOSED);
file_size = os_file_get_size(m_handle);
/* A size of (os_offset_t) -1 is treated as failure to get the size. */
if (file_size == (os_offset_t) -1) {
ib::error() << "Could not get file size of datafile '"
<< m_filepath << "'";
return(DB_CORRUPTION);
}
/* Assuming a page size, read the space_id from each page and store it
in a map. Find out which space_id is agreed on by majority of the
pages. Choose that space_id. */
for (ulint page_size = UNIV_ZIP_SIZE_MIN;
page_size <= UNIV_PAGE_SIZE_MAX;
page_size <<= 1) {
/* map[space_id] = count of pages */
typedef std::map<
ulint,
ulint,
std::less<ulint>,
ut_allocator<std::pair<const ulint, ulint> > >
Pages;
Pages verify;
ulint page_count = 64;
ulint valid_pages = 0;
/* Adjust the number of pages to analyze based on file size */
while ((page_count * page_size) > file_size) {
--page_count;
}
ib::info()
<< "Page size:" << page_size
<< ". Pages to analyze:" << page_count;
/* A scratch buffer is allocated for every candidate page size and
freed again after the pages have been surveyed. */
byte* buf = static_cast<byte*>(
ut_malloc_nokey(2 * UNIV_PAGE_SIZE_MAX));
byte* page = static_cast<byte*>(
ut_align(buf, UNIV_SECTOR_SIZE));
ulint fsp_flags;
/* provide dummy value if the first os_file_read() fails */
switch (srv_checksum_algorithm) {
case SRV_CHECKSUM_ALGORITHM_STRICT_FULL_CRC32:
case SRV_CHECKSUM_ALGORITHM_FULL_CRC32:
fsp_flags = 1U << FSP_FLAGS_FCRC32_POS_MARKER
| FSP_FLAGS_FCRC32_PAGE_SSIZE()
| innodb_compression_algorithm
<< FSP_FLAGS_FCRC32_POS_COMPRESSED_ALGO;
break;
default:
fsp_flags = 0;
}
for (ulint j = 0; j < page_count; ++j) {
dberr_t err;
/* Byte offset of page j for the assumed page size. */
ulint n_bytes = j * page_size;
IORequest request(IORequest::READ);
err = os_file_read(
request, m_handle, page, n_bytes, page_size);
if (err != DB_SUCCESS) {
/* An unreadable page is skipped, not treated as fatal. */
ib::info()
<< "READ FAIL: page_no:" << j;
continue;
}
/* The flags used for checking all pages come from the header of
page 0, when that page could be read. */
if (j == 0) {
fsp_flags = mach_read_from_4(
page + FSP_HEADER_OFFSET + FSP_SPACE_FLAGS);
}
bool noncompressed_ok = false;
/* For noncompressed pages, the page size must be
equal to srv_page_size. */
if (page_size == srv_page_size) {
noncompressed_ok = !buf_page_is_corrupted(
false, page, fsp_flags);
}
bool compressed_ok = false;
/* The compressed check applies only when srv_page_size does not
exceed UNIV_PAGE_SIZE_DEF and the assumed size does not exceed
srv_page_size. */
if (srv_page_size <= UNIV_PAGE_SIZE_DEF
&& page_size <= srv_page_size) {
compressed_ok = !buf_page_is_corrupted(
false, page, fsp_flags);
}
if (noncompressed_ok || compressed_ok) {
ulint space_id = mach_read_from_4(page
+ FIL_PAGE_SPACE_ID);
/* Only nonzero space IDs are counted. */
if (space_id > 0) {
ib::info()
<< "VALID: space:"
<< space_id << " page_no:" << j
<< " page_size:" << page_size;
++valid_pages;
++verify[space_id];
}
}
}
ut_free(buf);
ib::info()
<< "Page size: " << page_size
<< ". Possible space_id count:" << verify.size();
/* Accept a space ID whose page count equals the number of valid
pages minus "missed", trying missed = 0 first and then allowing up
to pages_corrupted disagreeing pages. */
const ulint pages_corrupted = 3;
for (ulint missed = 0; missed <= pages_corrupted; ++missed) {
for (Pages::const_iterator it = verify.begin();
it != verify.end();
++it) {
ib::info() << "space_id:" << it->first
<< ", Number of pages matched: "
<< it->second << "/" << valid_pages
<< " (" << page_size << ")";
if (it->second == (valid_pages - missed)) {
ib::info() << "Chosen space:"
<< it->first;
m_space_id = it->first;
return(DB_SUCCESS);
}
}
}
}
/* No candidate page size produced an agreed space ID. */
return(DB_CORRUPTION);
}
/** Restore the first page of the tablespace from
the double write buffer.
@return whether the operation failed */
bool
Datafile::restore_from_doublewrite()
{
if (srv_operation != SRV_OPERATION_NORMAL) {
return true;
}
/* Find if double write buffer contains page_no of given space id. */
const byte* page = recv_sys->dblwr.find_page(m_space_id, 0);
const page_id_t page_id(m_space_id, 0);
if (page == NULL) {
/* If the first page of the given user tablespace is not there
in the doublewrite buffer, then the recovery is going to fail
now. Hence this is treated as an error. */
ib::error()
<< "Corrupted page " << page_id
<< " of datafile '" << m_filepath
<< "' could not be found in the doublewrite buffer.";
return(true);
}
ulint flags = mach_read_from_4(
FSP_HEADER_OFFSET + FSP_SPACE_FLAGS + page);
if (!fil_space_t::is_valid_flags(flags, m_space_id)) {
ulint cflags = fsp_flags_convert_from_101(flags);
if (cflags == ULINT_UNDEFINED) {
ib::warn()
<< "Ignoring a doublewrite copy of page "
<< page_id
<< " due to invalid flags " << ib::hex(flags);
return(true);
}
flags = cflags;
/* The flags on the page should be converted later. */
}
ulint physical_size = fil_space_t::physical_size(flags);
ut_a(page_get_page_no(page) == page_id.page_no());
ib::info() << "Restoring page " << page_id
<< " of datafile '" << m_filepath
<< "' from the doublewrite buffer. Writing "
<< physical_size << " bytes into file '"
<< m_filepath << "'";
IORequest request(IORequest::WRITE);
return(os_file_write(
request,
m_filepath, m_handle, page, 0, physical_size)
!= DB_SUCCESS);
}
/** Build the link file name from m_name (unless m_link_filepath is already
set), then read that file and store its contents in m_filepath.
@retval DB_SUCCESS if remote linked tablespace file is opened and read.
@retval DB_CANNOT_OPEN_FILE if the link file does not exist. */
dberr_t
RemoteDatafile::open_link_file()
{
	if (m_link_filepath == NULL) {
		m_link_filepath = fil_make_filepath(NULL, name(), ISL, false);
	}

	m_filepath = read_link_file(m_link_filepath);

	if (m_filepath == NULL) {
		return(DB_CANNOT_OPEN_FILE);
	}

	return(DB_SUCCESS);
}
/** Open, in read-only mode, the data file that an InnoDB Symbolic Link file
points to, so that it can be validated. The link file is read first when no
filepath is known yet.
@param[in]	strict	whether to issue error messages
@retval DB_SUCCESS	if remote linked tablespace file is found and opened
@retval DB_ERROR	if the link file could not be opened
@return otherwise the error from Datafile::open_read_only() */
dberr_t
RemoteDatafile::open_read_only(bool strict)
{
	if (m_filepath == NULL) {
		if (open_link_file() == DB_CANNOT_OPEN_FILE) {
			return(DB_ERROR);
		}
	}

	const dberr_t	open_err = Datafile::open_read_only(strict);

	if (strict && open_err != DB_SUCCESS) {
		/* The following call prints an error message */
		os_file_get_last_error(true);

		ib::error() << "A link file was found named '"
			<< m_link_filepath << "' but the linked tablespace '"
			<< m_filepath << "' could not be opened read-only.";
	}

	return(open_err);
}
/** Open, in read-write mode, the data file that an InnoDB Symbolic Link file
points to, so that it can be restored from doublewrite and validated. The
link file is read first when no filepath is known yet.
@param[in]	read_only_mode	If true, then readonly mode checks are enforced.
@retval DB_SUCCESS	if remote linked tablespace file is found and opened
@retval DB_ERROR	if the link file could not be opened
@return otherwise the error from Datafile::open_read_write() */
dberr_t
RemoteDatafile::open_read_write(bool read_only_mode)
{
	if (m_filepath == NULL) {
		if (open_link_file() == DB_CANNOT_OPEN_FILE) {
			return(DB_ERROR);
		}
	}

	const dberr_t	open_err = Datafile::open_read_write(read_only_mode);

	if (open_err == DB_SUCCESS) {
		return(open_err);
	}

	/* The following call prints an error message */
	m_last_os_error = os_file_get_last_error(true);

	ib::error() << "A link file was found named '"
		<< m_link_filepath << "' but the linked data file '"
		<< m_filepath << "' could not be opened for writing.";

	return(open_err);
}
/** Release the resources. */
void
RemoteDatafile::shutdown()
{
Datafile::shutdown();
if (m_link_filepath != 0) {
ut_free(m_link_filepath);
m_link_filepath = 0;
}
}
/** Creates a new InnoDB Symbolic Link (ISL) file. It is always created
under the 'datadir' of MySQL. The datadir is the directory of a
running mysqld program. We can refer to it by simply using the path ".".
If a link file with the same contents already exists, nothing is written.
A failure while writing or closing the file is reported as DB_ERROR,
because the path only reaches the file once the stream is flushed.
@param[in]	name		tablespace name
@param[in]	filepath	remote filepath of tablespace datafile
@retval DB_SUCCESS		if the link file exists with this filepath
@retval DB_TABLESPACE_EXISTS	if a different link file is in the way, or
				its status could not be determined
@retval DB_OUT_OF_FILE_SPACE	if the disk is full
@retval DB_ERROR		on any other failure */
dberr_t
RemoteDatafile::create_link_file(
	const char*	name,
	const char*	filepath)
{
	bool		success;
	dberr_t		err = DB_SUCCESS;
	char*		link_filepath = NULL;
	char*		prev_filepath = NULL;

	ut_ad(!srv_read_only_mode);
	ut_ad(0 == strcmp(&filepath[strlen(filepath) - 4], DOT_IBD));

	link_filepath = fil_make_filepath(NULL, name, ISL, false);

	if (link_filepath == NULL) {
		return(DB_ERROR);
	}

	prev_filepath = read_link_file(link_filepath);
	if (prev_filepath) {
		/* Truncate will call this with an existing
		link file which contains the same filepath. */
		bool same = !strcmp(prev_filepath, filepath);
		ut_free(prev_filepath);
		if (same) {
			ut_free(link_filepath);
			return(DB_SUCCESS);
		}
	}

	/** Check if the file already exists. */
	FILE*			file = NULL;
	bool			exists;
	os_file_type_t		ftype;

	success = os_file_status(link_filepath, &exists, &ftype);
	ulint error = 0;

	if (success && !exists) {

		file = fopen(link_filepath, "w");
		if (file == NULL) {
			/* This call will print its own error message */
			error = os_file_get_last_error(true);
		}
	} else {
		/* Either the file exists or its status is unknown; both
		cases are reported as "already exists". */
		error = OS_FILE_ALREADY_EXISTS;
	}

	if (error != 0) {

		ib::error() << "Cannot create file " << link_filepath << ".";

		if (error == OS_FILE_ALREADY_EXISTS) {
			ib::error() << "The link file: " << link_filepath
				<< " already exists.";
			err = DB_TABLESPACE_EXISTS;

		} else if (error == OS_FILE_DISK_FULL) {
			err = DB_OUT_OF_FILE_SPACE;

		} else {
			err = DB_ERROR;
		}

		/* file is not open, no need to close it. */
		ut_free(link_filepath);
		return(err);
	}

	const size_t	len = strlen(filepath);
	bool		failed = (fwrite(filepath, 1, len, file) != len);

	if (failed) {
		/* This call will print its own error message. It is made
		before fclose() so that the reported OS error belongs to
		the failed write. */
		os_file_get_last_error(true);
	}

	/* Close the file, we only need it at startup. fclose() flushes the
	buffered data, so its result decides whether the path really made
	it into the file. It is always called, also after a failed write. */
	if (fclose(file) != 0 && !failed) {
		failed = true;
		os_file_get_last_error(true);
	}

	if (failed) {
		ib::error() <<
			"Cannot write link file: "
			    << link_filepath << " filepath: " << filepath;
		err = DB_ERROR;
	}

	ut_free(link_filepath);

	return(err);
}
/** Delete the InnoDB Symbolic Link (ISL) file whose path is stored in
m_link_filepath, if that file exists. */
void
RemoteDatafile::delete_link_file(void)
{
	ut_ad(m_link_filepath != NULL);

	/* Without debug assertions a missing path is simply ignored. */
	if (m_link_filepath == NULL) {
		return;
	}

	os_file_delete_if_exists(innodb_data_file_key,
				 m_link_filepath, NULL);
}
/** Delete an InnoDB Symbolic Link (ISL) file by name.
@param[in] name tablespace name */
void
RemoteDatafile::delete_link_file(
const char* name)
{
char* link_filepath = fil_make_filepath(NULL, name, ISL, false);
if (link_filepath != NULL) {
os_file_delete_if_exists(
innodb_data_file_key, link_filepath, NULL);
ut_free(link_filepath);
}
}
/** Read an InnoDB Symbolic Link (ISL) file by name.
It is always created under the datadir of MySQL.
For file-per-table tablespaces, the isl file is expected to be
in a 'database' directory and called 'tablename.isl'.
Trailing whitespace and control characters are trimmed from the path that
was read, and the path is normalized. If the link file is empty, an empty
string is returned.
The caller must free the memory returned if it is not null.
@param[in]	link_filepath	filepath of the ISL file
@return Filepath of the IBD file read from the ISL file, or NULL if the
link file could not be opened */
char*
RemoteDatafile::read_link_file(
	const char*	link_filepath)
{
	FILE* file = fopen(link_filepath, "r+b" STR_O_CLOEXEC);
	if (file == NULL) {
		return(NULL);
	}

	char* filepath = static_cast<char*>(ut_malloc_nokey(OS_FILE_MAX_PATH));

	os_file_read_string(file, filepath, OS_FILE_MAX_PATH);
	fclose(file);

	if (filepath[0] != '\0') {
		/* Trim whitespace from end of filepath. The byte is compared
		as unsigned char: where plain char is signed, bytes >= 0x80
		would otherwise compare as negative and be stripped as if
		they were whitespace. The first five characters are never
		trimmed. */
		ulint last_ch = strlen(filepath) - 1;
		while (last_ch > 4
		       && static_cast<unsigned char>(filepath[last_ch])
		       <= 0x20) {
			filepath[last_ch--] = 0x00;
		}
		os_normalize_path(filepath);
	}

	return(filepath);
}
|