/***************************************************************************** Copyright (c) 1996, 2016, Oracle and/or its affiliates. All Rights Reserved. Copyright (c) 2017, 2020, MariaDB Corporation. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; version 2 of the License. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA *****************************************************************************/ /**************************************************//** @file include/data0type.h Data types Created 1/16/1996 Heikki Tuuri *******************************************************/ #ifndef data0type_h #define data0type_h #include "univ.i" /** Special length indicating a missing instantly added column */ #define UNIV_SQL_DEFAULT (UNIV_SQL_NULL - 1) /** @return whether a length is actually stored in a field */ #define len_is_stored(len) (len != UNIV_SQL_NULL && len != UNIV_SQL_DEFAULT) extern ulint data_mysql_default_charset_coll; #define DATA_MYSQL_BINARY_CHARSET_COLL 63 /* SQL data type struct */ struct dtype_t; /** SQL Like operator comparison types */ enum ib_like_t { IB_LIKE_EXACT, /**< e.g. STRING */ IB_LIKE_PREFIX /**< e.g., STRING% */ }; /*-------------------------------------------*/ /* The 'MAIN TYPE' of a column */ #define DATA_MISSING 0 /* missing column */ #define DATA_VARCHAR 1 /* character varying of the latin1_swedish_ci charset-collation; note that the MySQL format for this, DATA_BINARY, DATA_VARMYSQL, is also affected by whether the 'precise type' contains DATA_MYSQL_TRUE_VARCHAR */ #define DATA_CHAR 2 /* fixed length character of the latin1_swedish_ci charset-collation */ #define DATA_FIXBINARY 3 /* binary string of fixed length */ #define DATA_BINARY 4 /* binary string */ #define DATA_BLOB 5 /* binary large object, or a TEXT type; if prtype & DATA_BINARY_TYPE == 0, then this is actually a TEXT column (or a BLOB created with < 4.0.14; since column prefix indexes came only in 4.0.14, the missing flag in BLOBs created before that does not cause any harm) */ #define DATA_INT 6 /* integer: can be any size 1 - 8 bytes */ #define DATA_SYS_CHILD 7 /* address of the child page in node pointer */ #define DATA_SYS 8 /* system column */ /* Data types >= DATA_FLOAT must be compared using the whole field, not as binary strings */ #define DATA_FLOAT 9 #define DATA_DOUBLE 10 #define DATA_DECIMAL 11 /* decimal number stored as an ASCII string */ #define DATA_VARMYSQL 12 /* any charset varying length char */ #define DATA_MYSQL 13 /* any charset fixed length char */ /* NOTE that 4.1.1 used DATA_MYSQL and DATA_VARMYSQL for all character sets, and the charset-collation for tables created with it can also be latin1_swedish_ci */ /* DATA_GEOMETRY includes all standard geometry datatypes as described in OGC standard(point, line_string, polygon, multi_point, multi_polygon, multi_line_string, geometry_collection, geometry). Currently, geometry data is stored in the standard Well-Known Binary(WKB) format (http://www.opengeospatial.org/standards/sfa). We use BLOB as the underlying datatype. */ #define DATA_GEOMETRY 14 /* geometry datatype of variable length */ #define DATA_MTYPE_MAX 63 /* dtype_store_for_order_and_null_size() requires the values are <= 63 */ #define DATA_MTYPE_CURRENT_MIN DATA_VARCHAR /* minimum value of mtype */ #define DATA_MTYPE_CURRENT_MAX DATA_GEOMETRY /* maximum value of mtype */ /*-------------------------------------------*/ /* The 'PRECISE TYPE' of a column */ /* Tables created by a MySQL user have the following convention: - In the least significant byte in the precise type we store the MySQL type code (not applicable for system columns). - In the second least significant byte we OR flags DATA_NOT_NULL, DATA_UNSIGNED, DATA_BINARY_TYPE. - In the third least significant byte of the precise type of string types we store the MySQL charset-collation code. In DATA_BLOB columns created with < 4.0.14 we do not actually know if it is a BLOB or a TEXT column. Since there are no indexes on prefixes of BLOB or TEXT columns in < 4.0.14, this is no problem, though. Note that versions < 4.1.2 or < 5.0.1 did not store the charset code to the precise type, since the charset was always the default charset of the MySQL installation. If the stored charset code is 0 in the system table SYS_COLUMNS of InnoDB, that means that the default charset of this MySQL installation should be used. When loading a table definition from the system tables to the InnoDB data dictionary cache in main memory, InnoDB versions >= 4.1.2 and >= 5.0.1 check if the stored charset-collation is 0, and if that is the case and the type is a non-binary string, replace that 0 by the default charset-collation code of this MySQL installation. In short, in old tables, the charset-collation code in the system tables on disk can be 0, but in in-memory data structures (dtype_t), the charset-collation code is always != 0 for non-binary string types. In new tables, in binary string types, the charset-collation code is the MySQL code for the 'binary charset', that is, != 0. For binary string types and for DATA_CHAR, DATA_VARCHAR, and for those DATA_BLOB which are binary or have the charset-collation latin1_swedish_ci, InnoDB performs all comparisons internally, without resorting to the MySQL comparison functions. This is to save CPU time. InnoDB's own internal system tables have different precise types for their columns, and for them the precise type is usually not used at all. */ #define DATA_ENGLISH 4 /* English language character string: this is a relic from pre-MySQL time and only used for InnoDB's own system tables */ #define DATA_ERROR 111 /* another relic from pre-MySQL time */ #define DATA_MYSQL_TYPE_MASK 255U/* AND with this mask to extract the MySQL type from the precise type */ #define DATA_MYSQL_TRUE_VARCHAR 15 /* MySQL type code for the >= 5.0.3 format true VARCHAR */ /* Precise data types for system columns and the length of those columns; NOTE: the values must run from 0 up in the order given! All codes must be less than 256 */ #define DATA_ROW_ID 0 /* row id: a 48-bit integer */ #define DATA_ROW_ID_LEN 6 /* stored length for row id */ #define DATA_TRX_ID 1 /* transaction id: 6 bytes */ #define DATA_TRX_ID_LEN 6 #define DATA_ROLL_PTR 2 /* rollback data pointer: 7 bytes */ #define DATA_ROLL_PTR_LEN 7 #define DATA_N_SYS_COLS 3 /* number of system columns defined above */ #define DATA_FTS_DOC_ID 3 /* Used as FTS DOC ID column */ #define DATA_SYS_PRTYPE_MASK 0xFU /* mask to extract the above from prtype */ /* Flags ORed to the precise data type */ #define DATA_NOT_NULL 256U /* this is ORed to the precise type when the column is declared as NOT NULL */ #define DATA_UNSIGNED 512U /* this id ORed to the precise type when we have an unsigned integer type */ #define DATA_BINARY_TYPE 1024U /* if the data type is a binary character string, this is ORed to the precise type: this only holds for tables created with >= MySQL-4.0.14 */ /* #define DATA_NONLATIN1 2048 This is a relic from < 4.1.2 and < 5.0.1. In earlier versions this was set for some BLOB columns. */ #define DATA_GIS_MBR 2048U /* Used as GIS MBR column */ /** the size of a GIS maximum bounding rectangle */ constexpr uint8_t DATA_MBR_LEN= uint8_t(SPDIMS * 2 * sizeof(double)); #define DATA_LONG_TRUE_VARCHAR 4096U /* this is ORed to the precise data type when the column is true VARCHAR where MySQL uses 2 bytes to store the data len; for shorter VARCHARs MySQL uses only 1 byte */ #define DATA_VIRTUAL 8192U /* Virtual column */ /** System Versioning */ #define DATA_VERS_START 16384U /* start system field */ #define DATA_VERS_END 32768U /* end system field */ /** system-versioned user data column */ #define DATA_VERSIONED (DATA_VERS_START|DATA_VERS_END) /** Check whether locking is disabled (never). */ #define dict_table_is_locking_disabled(table) false /*-------------------------------------------*/ /* This many bytes we need to store the type information affecting the alphabetical order for a single field and decide the storage size of an SQL null*/ #define DATA_ORDER_NULL_TYPE_BUF_SIZE 4 /* In the >= 4.1.x storage format we add 2 bytes more so that we can also store the charset-collation number; one byte is left unused, though */ #define DATA_NEW_ORDER_NULL_TYPE_BUF_SIZE 6 /* Maximum multi-byte character length in bytes, plus 1 */ #define DATA_MBMAX 8 /* For checking if mtype is GEOMETRY datatype */ #define DATA_GEOMETRY_MTYPE(mtype) ((mtype) == DATA_GEOMETRY) /* For checking if mtype is BLOB or GEOMETRY, since we use BLOB as the underlying datatype of GEOMETRY data. */ #define DATA_LARGE_MTYPE(mtype) ((mtype) == DATA_BLOB \ || (mtype) == DATA_GEOMETRY) /* For checking if data type is big length data type. */ #define DATA_BIG_LEN_MTYPE(len, mtype) ((len) > 255 || DATA_LARGE_MTYPE(mtype)) /* For checking if the column is a big length column. */ #define DATA_BIG_COL(col) DATA_BIG_LEN_MTYPE((col)->len, (col)->mtype) /* For checking if data type is large binary data type. */ #define DATA_LARGE_BINARY(mtype,prtype) ((mtype) == DATA_GEOMETRY || \ ((mtype) == DATA_BLOB && !((prtype) & DATA_BINARY_TYPE))) /* We now support 15 bits (up to 32767) collation number */ #define MAX_CHAR_COLL_NUM 32767 /* Mask to get the Charset Collation number (0x7fff) */ #define CHAR_COLL_MASK MAX_CHAR_COLL_NUM /*********************************************************************//** Gets the MySQL type code from a dtype. @return MySQL type code; this is NOT an InnoDB type code! */ UNIV_INLINE ulint dtype_get_mysql_type( /*=================*/ const dtype_t* type); /*!< in: type struct */ /*********************************************************************//** Determine how many bytes the first n characters of the given string occupy. If the string is shorter than n characters, returns the number of bytes the characters in the string occupy. @return length of the prefix, in bytes */ ulint dtype_get_at_most_n_mbchars( /*========================*/ ulint prtype, /*!< in: precise type */ ulint mbminlen, /*!< in: minimum length of a multi-byte character, in bytes */ ulint mbmaxlen, /*!< in: maximum length of a multi-byte character, in bytes */ ulint prefix_len, /*!< in: length of the requested prefix, in characters, multiplied by dtype_get_mbmaxlen(dtype) */ ulint data_len, /*!< in: length of str (in bytes) */ const char* str); /*!< in: the string whose prefix length is being determined */ /** @return whether main type is a string type */ inline bool dtype_is_string_type(ulint mtype) { return mtype <= DATA_BLOB || mtype == DATA_MYSQL || mtype == DATA_VARMYSQL; } /** @return whether a type is a binary string type */ inline bool dtype_is_binary_string_type(ulint mtype, ulint prtype) { /* Note that for tables created before MySQL 4.0.14, we do not know if a DATA_BLOB column is a BLOB or a TEXT column. For those DATA_BLOB columns we return false. */ return mtype == DATA_FIXBINARY || mtype == DATA_BINARY || (mtype == DATA_BLOB && (prtype & DATA_BINARY_TYPE)); } /** @return whether a type is a non-binary string type */ inline bool dtype_is_non_binary_string_type(ulint mtype, ulint prtype) { return dtype_is_string_type(mtype) && !dtype_is_binary_string_type(mtype, prtype); } /*********************************************************************//** Sets a data type structure. */ UNIV_INLINE void dtype_set( /*======*/ dtype_t* type, /*!< in: type struct to init */ ulint mtype, /*!< in: main data type */ ulint prtype, /*!< in: precise type */ ulint len); /*!< in: precision of type */ /*********************************************************************//** Copies a data type structure. */ UNIV_INLINE void dtype_copy( /*=======*/ dtype_t* type1, /*!< in: type struct to copy to */ const dtype_t* type2); /*!< in: type struct to copy from */ /*********************************************************************//** Gets the SQL main data type. @return SQL main data type */ UNIV_INLINE ulint dtype_get_mtype( /*============*/ const dtype_t* type); /*!< in: data type */ /*********************************************************************//** Gets the precise data type. @return precise data type */ UNIV_INLINE ulint dtype_get_prtype( /*=============*/ const dtype_t* type); /*!< in: data type */ /*********************************************************************//** Compute the mbminlen and mbmaxlen members of a data type structure. */ UNIV_INLINE void dtype_get_mblen( /*============*/ ulint mtype, /*!< in: main type */ ulint prtype, /*!< in: precise type (and collation) */ unsigned* mbminlen, /*!< out: minimum length of a multi-byte character */ unsigned* mbmaxlen); /*!< out: maximum length of a multi-byte character */ /** Get the charset-collation code for string types. @param prtype InnoDB precise type @return charset-collation code */ inline uint16_t dtype_get_charset_coll(ulint prtype) { return static_cast(prtype >> 16) & CHAR_COLL_MASK; } /** Form a precise type from the < 4.1.2 format precise type plus the charset-collation code. @param[in] old_prtype MySQL type code and the flags DATA_BINARY_TYPE etc. @param[in] charset_coll character-set collation code @return precise type, including the charset-collation code */ UNIV_INLINE uint32_t dtype_form_prtype(ulint old_prtype, ulint charset_coll) { ut_ad(old_prtype < 256 * 256); ut_ad(charset_coll <= MAX_CHAR_COLL_NUM); return(uint32_t(old_prtype + (charset_coll << 16))); } /*********************************************************************//** Determines if a MySQL string type is a subset of UTF-8. This function may return false negatives, in case further character-set collation codes are introduced in MySQL later. @return whether a subset of UTF-8 */ UNIV_INLINE bool dtype_is_utf8( /*==========*/ ulint prtype);/*!< in: precise data type */ /*********************************************************************//** Gets the type length. @return fixed length of the type, in bytes, or 0 if variable-length */ UNIV_INLINE ulint dtype_get_len( /*==========*/ const dtype_t* type); /*!< in: data type */ /*********************************************************************//** Gets the minimum length of a character, in bytes. @return minimum length of a char, in bytes, or 0 if this is not a character type */ UNIV_INLINE ulint dtype_get_mbminlen( /*===============*/ const dtype_t* type); /*!< in: type */ /*********************************************************************//** Gets the maximum length of a character, in bytes. @return maximum length of a char, in bytes, or 0 if this is not a character type */ UNIV_INLINE ulint dtype_get_mbmaxlen( /*===============*/ const dtype_t* type); /*!< in: type */ /***********************************************************************//** Returns the size of a fixed size data type, 0 if not a fixed size type. @return fixed size, or 0 */ UNIV_INLINE unsigned dtype_get_fixed_size_low( /*=====================*/ ulint mtype, /*!< in: main type */ ulint prtype, /*!< in: precise type */ ulint len, /*!< in: length */ ulint mbminlen, /*!< in: minimum length of a multibyte character, in bytes */ ulint mbmaxlen, /*!< in: maximum length of a multibyte character, in bytes */ ulint comp); /*!< in: nonzero=ROW_FORMAT=COMPACT */ /***********************************************************************//** Returns the minimum size of a data type. @return minimum size */ UNIV_INLINE unsigned dtype_get_min_size_low( /*===================*/ ulint mtype, /*!< in: main type */ ulint prtype, /*!< in: precise type */ ulint len, /*!< in: length */ ulint mbminlen, /*!< in: minimum length of a character */ ulint mbmaxlen); /*!< in: maximum length of a character */ /***********************************************************************//** Returns the maximum size of a data type. Note: types in system tables may be incomplete and return incorrect information. @return maximum size */ UNIV_INLINE ulint dtype_get_max_size_low( /*===================*/ ulint mtype, /*!< in: main type */ ulint len); /*!< in: length */ /***********************************************************************//** Returns the ROW_FORMAT=REDUNDANT stored SQL NULL size of a type. For fixed length types it is the fixed length of the type, otherwise 0. @return SQL null storage size in ROW_FORMAT=REDUNDANT */ UNIV_INLINE ulint dtype_get_sql_null_size( /*====================*/ const dtype_t* type, /*!< in: type */ ulint comp); /*!< in: nonzero=ROW_FORMAT=COMPACT */ /**********************************************************************//** Reads to a type the stored information which determines its alphabetical ordering and the storage size of an SQL NULL value. */ UNIV_INLINE void dtype_read_for_order_and_null_size( /*===============================*/ dtype_t* type, /*!< in: type struct */ const byte* buf); /*!< in: buffer for the stored order info */ /**********************************************************************//** Stores for a type the information which determines its alphabetical ordering and the storage size of an SQL NULL value. This is the >= 4.1.x storage format. */ UNIV_INLINE void dtype_new_store_for_order_and_null_size( /*====================================*/ byte* buf, /*!< in: buffer for DATA_NEW_ORDER_NULL_TYPE_BUF_SIZE bytes where we store the info */ const dtype_t* type, /*!< in: type struct */ ulint prefix_len);/*!< in: prefix length to replace type->len, or 0 */ /**********************************************************************//** Reads to a type the stored information which determines its alphabetical ordering and the storage size of an SQL NULL value. This is the 4.1.x storage format. */ UNIV_INLINE void dtype_new_read_for_order_and_null_size( /*===================================*/ dtype_t* type, /*!< in: type struct */ const byte* buf); /*!< in: buffer for stored type order info */ /*********************************************************************//** Returns the type's SQL name (e.g. BIGINT UNSIGNED) from mtype,prtype,len @return the SQL type name */ UNIV_INLINE char* dtype_sql_name( /*===========*/ unsigned mtype, /*!< in: mtype */ unsigned prtype, /*!< in: prtype */ unsigned len, /*!< in: len */ char* name, /*!< out: SQL name */ unsigned name_sz);/*!< in: size of the name buffer */ /*********************************************************************//** Validates a data type structure. @return TRUE if ok */ ibool dtype_validate( /*===========*/ const dtype_t* type); /*!< in: type struct to validate */ #ifdef UNIV_DEBUG /** Print a data type structure. @param[in] type data type */ void dtype_print( const dtype_t* type); #endif /* UNIV_DEBUG */ /* Structure for an SQL data type. If you add fields to this structure, be sure to initialize them everywhere. This structure is initialized in the following functions: dtype_set() dtype_read_for_order_and_null_size() dtype_new_read_for_order_and_null_size() sym_tab_add_null_lit() */ struct dtype_t{ unsigned prtype:32; /*!< precise type; MySQL data type, charset code, flags to indicate nullability, signedness, whether this is a binary string, whether this is a true VARCHAR where MySQL uses 2 bytes to store the length */ unsigned mtype:8; /*!< main data type */ /* the remaining fields do not affect alphabetical ordering: */ unsigned len:16; /*!< length; for MySQL data this is field->pack_length(), except that for a >= 5.0.3 type true VARCHAR this is the maximum byte length of the string data (in addition to the string, MySQL uses 1 or 2 bytes to store the string length) */ unsigned mbminlen:3; /*!< minimum length of a character, in bytes */ unsigned mbmaxlen:3; /*!< maximum length of a character, in bytes */ /** @return whether this is system versioned user field */ bool is_versioned() const { return !(~prtype & DATA_VERSIONED); } /** @return whether this is the system field start */ bool vers_sys_start() const { return (prtype & DATA_VERSIONED) == DATA_VERS_START; } /** @return whether this is the system field end */ bool vers_sys_end() const { return (prtype & DATA_VERSIONED) == DATA_VERS_END; } /** Set the type of the BLOB in the hidden metadata record. */ void metadata_blob_init() { prtype = DATA_NOT_NULL; mtype = DATA_BLOB; len = 0; mbminlen = 0; mbmaxlen = 0; } }; /** The DB_TRX_ID,DB_ROLL_PTR values for "no history is available" */ extern const byte reset_trx_id[DATA_TRX_ID_LEN + DATA_ROLL_PTR_LEN]; /** Info bit denoting the predefined minimum record: this bit is set if and only if the record is the first user record on a non-leaf B-tree page that is the leftmost page on its level (PAGE_LEVEL is nonzero and FIL_PAGE_PREV is FIL_NULL). */ #define REC_INFO_MIN_REC_FLAG 0x10UL /** The delete-mark flag in info bits */ #define REC_INFO_DELETED_FLAG 0x20UL /** Record status values for ROW_FORMAT=COMPACT,DYNAMIC,COMPRESSED */ enum rec_comp_status_t { /** User record (PAGE_LEVEL=0, heap>=PAGE_HEAP_NO_USER_LOW) */ REC_STATUS_ORDINARY = 0, /** Node pointer record (PAGE_LEVEL>=0, heap>=PAGE_HEAP_NO_USER_LOW) */ REC_STATUS_NODE_PTR = 1, /** The page infimum pseudo-record (heap=PAGE_HEAP_NO_INFIMUM) */ REC_STATUS_INFIMUM = 2, /** The page supremum pseudo-record (heap=PAGE_HEAP_NO_SUPREMUM) */ REC_STATUS_SUPREMUM = 3, /** Clustered index record that has been inserted or updated after instant ADD COLUMN (more than dict_index_t::n_core_fields) */ REC_STATUS_INSTANT = 4 }; /** The dtuple_t::info_bits of the hidden metadata of instant ADD COLUMN. @see rec_is_metadata() @see rec_is_alter_metadata() */ static const byte REC_INFO_METADATA_ADD = REC_INFO_MIN_REC_FLAG | REC_STATUS_INSTANT; /** The dtuple_t::info_bits of the hidden metadata of instant ALTER TABLE. @see rec_is_metadata() */ static const byte REC_INFO_METADATA_ALTER = REC_INFO_METADATA_ADD | REC_INFO_DELETED_FLAG; #include "data0type.ic" #endif