/* Copyright (c) 2020, 2024, Oracle and/or its affiliates.

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License, version 2.0,
   as published by the Free Software Foundation.

   This program is designed to work with certain software (including
   but not limited to OpenSSL) that is licensed under separate terms,
   as designated in a particular file or component or in included license
   documentation.  The authors of MySQL hereby grant you an additional
   permission to link the program and your derivative works with the
   separately licensed software that they have either included with
   the program or referenced in the documentation.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License, version 2.0, for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301  USA */

#include "mysql/strings/collations.h"

// NOTE(review): the standard header names were lost in the copy of this file
// that was reviewed; the list below covers every standard facility used in
// this translation unit -- confirm against the upstream file.
#include <algorithm>
#include <cassert>
#include <cstddef>
#include <cstdint>
#include <cstring>
#include <string>
#include <utility>

#include "mysql/strings/m_ctype.h"
#include "strings/collations_internal.h"

// TODO(geb): MY_CS_BUFFER_SIZE seems unreasonably large -- MY_CS_NAME_SIZE-1
//            should be enough.
/// Maximum number of characters of a name that Name keeps; longer input is
/// truncated to this length.
constexpr static size_t MY_CS_BUFFER_SIZE =
    static_cast<size_t>(MY_CS_NAME_SIZE) * 8;

/// Builds a normalized name from a NUL-terminated string.
///
/// @param name NUL-terminated name; nullptr is forwarded with size 0 and
///             handled by the two-argument constructor.
mysql::collation::Name::Name(const char *name)
    : Name(name, name != nullptr ? strlen(name) : 0) {}

/// Builds a normalized name from the first @p size characters of @p name.
///
/// The stored copy is lower-cased with the Latin1 to_lower table, truncated
/// to at most MY_CS_BUFFER_SIZE characters and NUL-terminated.
///
/// @param name source characters; nullptr asserts in debug builds and is
///             treated as an empty name otherwise.
/// @param size number of characters to read from @p name.
mysql::collation::Name::Name(const char *name, size_t size) {
  if (name == nullptr) {
    // TODO(gleb): throw std::invalid_argument instead?
    assert(false);
    name = "";
    // The fallback string is empty: do not read `size` bytes from it.
    size = 0;
  }

  // TODO(gleb): fail instead of truncating too long names?
  const size_t truncated_size = std::min(size, MY_CS_BUFFER_SIZE);
  char *normalized = new char[truncated_size + 1];
  for (size_t i = 0; i < truncated_size; i++) {
    // TODO(gleb): use ASCII instead of Latin1?
    normalized[i] = static_cast<char>(
        my_charset_latin1.to_lower[static_cast<uint8_t>(name[i])]);
  }
  normalized[truncated_size] = '\0';

  m_normalized = normalized;
}

/// Copy constructor: duplicates the normalized string of @p name.
///
/// A moved-from source (whose buffer pointer is null) yields a copy in the
/// same null state instead of passing a null pointer to strlen().
mysql::collation::Name::Name(const mysql::collation::Name &name) {
  if (name.m_normalized == nullptr) {
    m_normalized = nullptr;
    return;
  }
  const size_t size = strlen(name.m_normalized);
  char *normalized = new char[size + 1];
  memcpy(normalized, name.m_normalized, size + 1);
  m_normalized = normalized;
}

/// Move constructor: takes over the buffer of @p name and leaves @p name
/// holding a null pointer.
mysql::collation::Name::Name(mysql::collation::Name &&name) noexcept
    : m_normalized(name.m_normalized) {
  name.m_normalized = nullptr;
}

/// Releases the owned buffer (deleting a null pointer is a no-op).
mysql::collation::Name::~Name() { delete[] m_normalized; }

/// @cond Doxygen_is_confused

/// Copy assignment.
///
/// The copy is fully constructed before *this is modified, so an allocation
/// failure leaves *this unchanged; the previous buffer is released when the
/// temporary goes out of scope.
mysql::collation::Name &mysql::collation::Name::Name::operator=(
    const Name &name) {
  if (this != &name) {
    Name copy(name);
    std::swap(m_normalized, copy.m_normalized);
  }
  return *this;
}

/// Move assignment: frees the current buffer, takes over the buffer of
/// @p name and leaves @p name holding a null pointer.
mysql::collation::Name &mysql::collation::Name::Name::operator=(
    Name &&name) noexcept {
  if (this != &name) {
    delete[] m_normalized;
    m_normalized = std::exchange(name.m_normalized, nullptr);
  }
  return *this;
}
/// @endcond

/// Creates the Collations object and stores it in
/// mysql::collation_internals::entry.
///
/// Asserts (debug builds) that no such object exists yet.
///
/// @param charset_dir forwarded to the Collations constructor.
/// @param loader      forwarded to the Collations constructor.
void mysql::collation::initialize(const char *charset_dir,
                                  MY_CHARSET_LOADER *loader) {
  assert(mysql::collation_internals::entry == nullptr);
  mysql::collation_internals::entry =
      new mysql::collation_internals::Collations{charset_dir, loader};
}

/// Destroys the object created by initialize() and resets the pointer, so a
/// repeated call is harmless.
void mysql::collation::shutdown() {
  delete mysql::collation_internals::entry;
  mysql::collation_internals::entry = nullptr;
}

/// Shorthand for the current mysql::collation_internals::entry pointer.
static auto entry() { return mysql::collation_internals::entry; }

/// Forwards to Collations::find_by_name() on the current entry.
const CHARSET_INFO *mysql::collation::find_by_name(const Name &name) {
  return entry()->find_by_name(name);
}

/// Forwards to Collations::find_by_id() on the current entry.
const CHARSET_INFO *mysql::collation::find_by_id(unsigned id) {
  return entry()->find_by_id(id);
}

/// Forwards to Collations::find_primary() on the current entry, after
/// replacing the character set name "utf8" with "utf8mb3".
///
/// @param cs_name character set name; taken by value because it may be
///                rewritten before the lookup.
const CHARSET_INFO *mysql::collation::find_primary(Name cs_name) {
  // Needed by lexer, to parse e.g. "select _utf8 0xD0B0D0B1D0B2;"
  if (cs_name() == "utf8") {
    // Uncomment to catch unwanted use of "utf8".
    // assert(false);
    cs_name = Name("utf8mb3");
  }
  return entry()->find_primary(cs_name);
}

/// Forwards to Collations::find_default_binary() on the current entry.
const CHARSET_INFO *mysql::collation::find_default_binary(const Name &cs_name) {
  return entry()->find_default_binary(cs_name);
}