/* Copyright (c) 2017, 2024, Oracle and/or its affiliates. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License, version 2.0, as published by the Free Software Foundation. This program is designed to work with certain software (including but not limited to OpenSSL) that is licensed under separate terms, as designated in a particular file or component or in included license documentation. The authors of MySQL hereby grant you an additional permission to link the program and your derivative works with the separately licensed software that they have either included with the program or referenced in the documentation. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License, version 2.0, for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */ #include "resource_group_mgr.h" #include "my_config.h" #include #include #include #include #include #include #include "map_helpers.h" #include "my_compiler.h" #include "my_psi_config.h" #include "my_sys.h" #include "mysql/components/services/bits/psi_bits.h" #include "mysql/components/services/log_builtins.h" // LogErr #include "mysql/psi/mysql_rwlock.h" #include "mysql/service_plugin_registry.h" #include "mysql/strings/m_ctype.h" #include "mysql/thread_type.h" #include "mysql_com.h" #include "mysqld_error.h" #include "pfs_thread_provider.h" #include "sql/auth/auth_acls.h" // SUPER_ACL #include "sql/auth/sql_security_ctx.h" #include "sql/current_thd.h" // current_thd #include "sql/dd/cache/dictionary_client.h" // Dictionary_client #include "sql/dd/dd_resource_group.h" // dd::create_resource_group #include "sql/dd/string_type.h" #include "sql/dd/types/resource_group.h" #include "sql/handler.h" #include "sql/log.h" // LogErr #include "sql/mysqld.h" // key_resource_group_mgr* #include "sql/resourcegroups/platform/thread_attrs_api.h" #include "sql/resourcegroups/resource_group.h" #include "sql/resourcegroups/thread_resource_control.h" #include "sql/sql_class.h" // class THD #include "sql/system_variables.h" #include "sql/thd_raii.h" #include "sql_string.h" // to_lex_cstring #include "string_with_len.h" namespace resourcegroups { const char *SYS_DEFAULT_RESOURCE_GROUP_NAME = "SYS_default"; const char *USR_DEFAULT_RESOURCE_GROUP_NAME = "USR_default"; Resource_group_mgr *Resource_group_mgr::m_instance = nullptr; void thread_create_callback(const PSI_thread_attrs *thread_attrs) { auto res_grp_mgr = resourcegroups::Resource_group_mgr::instance(); if (!res_grp_mgr->resource_group_support()) return; if (thread_attrs != nullptr) { const char *res_grp_name = thread_attrs->m_system_thread ? res_grp_mgr->sys_default_resource_group_name() : res_grp_mgr->usr_default_resource_group_name(); res_grp_mgr->set_res_grp_in_pfs(res_grp_name, strlen(res_grp_name), thread_attrs->m_thread_internal_id); } } void session_disconnect_callback(const PSI_thread_attrs *) { auto res_grp_mgr = resourcegroups::Resource_group_mgr::instance(); if (!res_grp_mgr->resource_group_support()) return; if (current_thd->resource_group_ctx()->m_cur_resource_group != nullptr) res_grp_mgr->move_resource_group( current_thd->resource_group_ctx()->m_cur_resource_group, res_grp_mgr->usr_default_resource_group()); } Resource_group_mgr *Resource_group_mgr::instance() { DBUG_TRACE; // Created during server startup. So no locking required. if (m_instance == nullptr) { m_instance = new (std::nothrow) Resource_group_mgr; assert(m_instance != nullptr); } return m_instance; } /** Persist an in-memory resource group to Data Dictionary. @param thd pointer to THD. @param resource_group Reference to the resource group to be persisted. @param update True if the resource groups exists and needs to be updated else resource group is created in DD. @returns true if resource group persistence to DD failed else false. */ static inline bool persist_resource_group( THD *thd, const resourcegroups::Resource_group &resource_group, bool update) { handlerton *ddse = ha_resolve_by_legacy_type(thd, DB_TYPE_INNODB); if (ddse->is_dict_readonly && ddse->is_dict_readonly()) { LogErr(WARNING_LEVEL, ER_RESOURCE_GROUP_METADATA_UPDATE_SKIPPED); return false; } Disable_autocommit_guard autocommit_guard(thd); dd::String_type name(resource_group.name().c_str()); bool res = update ? dd::update_resource_group(thd, name, resource_group) : dd::create_resource_group(thd, resource_group); if (res) { LogErr(ERROR_LEVEL, ER_FAILED_TO_PERSIST_RESOURCE_GROUP_METADATA, resource_group.name().c_str()); return true; } return false; } static bool deserialize_resource_groups(THD *thd) { DBUG_TRACE; /* Associate flag SYSTEM_THREAD_DD_INITIALIZE with THD context. This ensures we need not acquire MDL locks during initialization phase. */ thd->system_thread = SYSTEM_THREAD_DD_INITIALIZE; std::vector resource_group_vec; std::vector resource_group_ptr_vec; dd::cache::Dictionary_client::Auto_releaser releaser(thd->dd_client()); if (thd->dd_client()->fetch_global_components(&resource_group_vec)) return true; bool usr_default_in_dd = false; bool sys_default_in_dd = false; auto res_grp_mgr = Resource_group_mgr::instance(); for (const auto &resource_group : resource_group_vec) { if (my_strcasecmp(&my_charset_utf8mb3_general_ci, resource_group->name().c_str(), USR_DEFAULT_RESOURCE_GROUP_NAME) == 0) usr_default_in_dd = true; else if (my_strcasecmp(&my_charset_utf8mb3_general_ci, resource_group->name().c_str(), SYS_DEFAULT_RESOURCE_GROUP_NAME) == 0) sys_default_in_dd = true; else { auto resource_group_ptr = res_grp_mgr->deserialize_resource_group(resource_group); if (resource_group_ptr == nullptr) { LogErr(ERROR_LEVEL, ER_FAILED_TO_DESERIALIZE_RESOURCE_GROUP, resource_group->name().c_str()); return true; } resource_group_ptr_vec.push_back(resource_group_ptr); } } for (auto *resource_group_ptr : resource_group_ptr_vec) { // Validate the resource group and disable if validation is not successful auto thr_res_ctrl = resource_group_ptr->controller(); if (thr_res_ctrl->validate(resource_group_ptr->type())) { resource_group_ptr->set_enabled(false); // Update the resource group on-disk. Disable_autocommit_guard autocommit_guard(thd); if (dd::update_resource_group(thd, resource_group_ptr->name().c_str(), *resource_group_ptr)) { LogErr(WARNING_LEVEL, ER_FAILED_TO_UPDATE_RESOURCE_GROUP, resource_group_ptr->name().c_str()); return true; } LogErr(WARNING_LEVEL, ER_RESOURCE_GROUP_VALIDATION_FAILED, resource_group_ptr->name().c_str()); } } if (persist_resource_group(thd, *res_grp_mgr->usr_default_resource_group(), usr_default_in_dd)) return true; if (persist_resource_group(thd, *res_grp_mgr->sys_default_resource_group(), sys_default_in_dd)) return true; return false; } Resource_group *Resource_group_mgr::deserialize_resource_group( const dd::Resource_group *resource_group) { assert(m_resource_group_support); LEX_CSTRING name_cstr = to_lex_cstring(resource_group->name().c_str()); auto cpu_id_mask = resource_group->cpu_id_mask(); auto vcpu_range_vector = std::unique_ptr>( new (std::nothrow) std::vector); if (vcpu_range_vector.get() == nullptr) { LogErr(ERROR_LEVEL, ER_FAILED_TO_ALLOCATE_MEMORY_FOR_RESOURCE_GROUP, name_cstr.str); return nullptr; } int bit_start = -1, bit_end = -1; for (uint i = 0; i < cpu_id_mask.size(); i++) { if (cpu_id_mask[i]) bit_start == -1 ? (bit_start = bit_end = i) : (bit_end++); else if (bit_start != -1) { vcpu_range_vector->emplace_back(Range(bit_start, bit_end)); bit_start = bit_end = -1; } } auto resource_group_ptr = create_and_add_in_resource_group_hash( name_cstr, resource_group->resource_group_type(), resource_group->resource_group_enabled(), std::move(vcpu_range_vector), resource_group->thread_priority()); if (resource_group_ptr == nullptr) { LogErr(ERROR_LEVEL, ER_FAILED_TO_ADD_RESOURCE_GROUP_TO_MAP, name_cstr.str); return nullptr; } return resource_group_ptr; } bool Resource_group_mgr::acquire_shared_mdl_for_resource_group( THD *thd, const char *res_grp_name, enum_mdl_duration lock_duration, MDL_ticket **ticket, bool try_acquire) { DBUG_TRACE; MDL_key mdl_key; dd::Resource_group::create_mdl_key(res_grp_name, &mdl_key); MDL_request mdl_request; MDL_REQUEST_INIT_BY_KEY(&mdl_request, &mdl_key, MDL_INTENTION_EXCLUSIVE, lock_duration); bool res = try_acquire ? thd->mdl_context.acquire_lock(&mdl_request, 0) : thd->mdl_context.acquire_lock( &mdl_request, thd->variables.lock_wait_timeout); if (!res && ticket != nullptr) *ticket = mdl_request.ticket; return res; } void Resource_group_mgr::deinit() { if (m_resource_group_support && m_notify_svc != nullptr) { m_notify_svc->unregister_notification(m_notify_handle); m_registry_svc->release(m_h_res_grp_svc); m_h_res_grp_svc = nullptr; m_registry_svc->release(m_h_notification_svc); m_h_notification_svc = nullptr; mysql_plugin_registry_release(m_registry_svc); delete m_resource_group_hash; mysql_rwlock_destroy(&m_map_rwlock); } } bool Resource_group_mgr::post_init() { DBUG_TRACE; if (!m_resource_group_support) return false; if (!m_thread_priority_available) LogErr(INFORMATION_LEVEL, ER_THREAD_PRIORITY_IGNORED); // Create temporary THD to read Resource groups from disk. std::unique_ptr thd(new (std::nothrow) THD()); if (thd.get() == nullptr) return true; thd->thread_stack = reinterpret_cast(&thd); thd->store_globals(); thd->security_context()->set_master_access(SUPER_ACL); thd->variables.transaction_read_only = false; thd->tx_read_only = false; bool res = deserialize_resource_groups(thd.get()); return res; } bool Resource_group_mgr::init() { DBUG_TRACE; #ifndef WITH_PERFSCHEMA_STORAGE_ENGINE // WITH_PERFSCHEMA_STORAGE_ENGINE is always set. static_assert(0, "WITH_PERFSCHEMA_STORAGE_ENGINE not defined."); #endif if (!platform::is_platform_supported()) { m_unsupport_reason = "Platform Unsupported"; return false; } #ifdef DISABLE_PSI_THREAD // Resource group not supported with DISABLE_PSI_THREAD. m_resource_group_support = false; LogErr(INFORMATION_LEVEL, ER_RESOURCE_GROUP_IS_DISABLED); m_unsupport_reason = "Server compiled with DISABLE_PSI_THREAD"; return false; #endif m_resource_group_support = true; mysql_rwlock_init(key_rwlock_resource_group_mgr_map_lock, &m_map_rwlock); m_thread_priority_available = platform::can_thread_priority_be_set(); m_registry_svc = mysql_plugin_registry_acquire(); if (!m_registry_svc) { LogErr(WARNING_LEVEL, ER_COMPONENTS_FAILED_TO_ACQUIRE_SERVICE_IMPLEMENTATION, "registry"); return true; } if (m_registry_svc->acquire("pfs_resource_group_v3", &m_h_res_grp_svc)) { LogErr(WARNING_LEVEL, ER_COMPONENTS_FAILED_TO_ACQUIRE_SERVICE_IMPLEMENTATION, "pfs_resource_group_v3"); return true; } m_resource_group_svc = reinterpret_cast(m_h_res_grp_svc); if (m_registry_svc->acquire("pfs_notification_v3", &m_h_notification_svc)) { LogErr(WARNING_LEVEL, ER_COMPONENTS_FAILED_TO_ACQUIRE_SERVICE_IMPLEMENTATION, "pfs_notification_v3"); return true; } m_notify_svc = reinterpret_cast( m_h_notification_svc); // Register thread creation notification callbacks. PSI_notification callbacks; memset(&callbacks, 0, sizeof(callbacks)); callbacks.thread_create = &thread_create_callback; callbacks.session_disconnect = &session_disconnect_callback; m_notify_handle = m_notify_svc->register_notification(&callbacks, false); if (m_notify_handle == 0) { LogErr(WARNING_LEVEL, ER_PFS_NOTIFICATION_FUNCTION_REGISTER_FAILED, "Thread creation"); return true; } m_resource_group_hash = new collation_unordered_map>( &my_charset_utf8mb3_tolower_ci, PSI_INSTRUMENT_ME); if (m_resource_group_hash == nullptr) { LogErr(ERROR_LEVEL, ER_FAILED_TO_ALLOCATE_MEMORY_FOR_RESOURCE_GROUP_HASH); return true; } m_usr_default_resource_group = new (std::nothrow) Resource_group(USR_DEFAULT_RESOURCE_GROUP_NAME, resourcegroups::Type::USER_RESOURCE_GROUP, true); if (m_usr_default_resource_group == nullptr) { LogErr(ERROR_LEVEL, ER_FAILED_TO_ALLOCATE_MEMORY_FOR_RESOURCE_GROUP, "USR_default"); delete m_resource_group_hash; m_resource_group_hash = nullptr; return true; } m_sys_default_resource_group = new (std::nothrow) Resource_group(SYS_DEFAULT_RESOURCE_GROUP_NAME, resourcegroups::Type::SYSTEM_RESOURCE_GROUP, true); if (m_sys_default_resource_group == nullptr) { LogErr(ERROR_LEVEL, ER_FAILED_TO_ALLOCATE_MEMORY_FOR_RESOURCE_GROUP, "SYS_default"); delete m_resource_group_hash; m_resource_group_hash = nullptr; delete m_usr_default_resource_group; m_usr_default_resource_group = nullptr; return true; } add_resource_group( std::unique_ptr(m_usr_default_resource_group)); add_resource_group( std::unique_ptr(m_sys_default_resource_group)); // Initialize number of VCPUs. m_num_vcpus = platform::num_vcpus(); return false; } bool Resource_group_mgr::move_resource_group(Resource_group *from_res_grp, Resource_group *to_res_grp) { assert(m_resource_group_support); if (to_res_grp == nullptr) to_res_grp = m_usr_default_resource_group; if (from_res_grp == to_res_grp) return false; if (to_res_grp->controller()->apply_control()) { LogErr(WARNING_LEVEL, ER_FAILED_TO_APPLY_RESOURCE_GROUP_CONTROLLER, to_res_grp->name().c_str()); return false; } // Set resource group name in PFS. ulonglong pfs_thread_id = 0; #ifdef HAVE_PSI_THREAD_INTERFACE pfs_thread_id = PSI_THREAD_CALL(get_current_thread_internal_id)(); #endif m_resource_group_svc->set_thread_resource_group_by_id( nullptr, pfs_thread_id, to_res_grp->name().c_str(), to_res_grp->name().length(), nullptr); if (from_res_grp != nullptr && !is_resource_group_default(from_res_grp)) from_res_grp->remove_pfs_thread_id(pfs_thread_id); if (!is_resource_group_default(to_res_grp)) to_res_grp->add_pfs_thread_id(pfs_thread_id); return true; } void Resource_group_mgr::destroy_instance() { if (m_instance != nullptr) { m_instance->deinit(); delete m_instance; m_instance = nullptr; } } Resource_group *Resource_group_mgr::get_resource_group( const std::string &resource_group_name) { DBUG_TRACE; assert(m_resource_group_support); Resource_group *resource_group = nullptr; mysql_rwlock_rdlock(&m_map_rwlock); auto resource_group_iter = m_resource_group_hash->find(resource_group_name); if (resource_group_iter != m_resource_group_hash->end()) resource_group = resource_group_iter->second.get(); mysql_rwlock_unlock(&m_map_rwlock); return resource_group; } bool Resource_group_mgr::add_resource_group( std::unique_ptr resource_group_ptr) { DBUG_TRACE; assert(m_resource_group_support); mysql_rwlock_wrlock(&m_map_rwlock); m_resource_group_hash->emplace(resource_group_ptr->name(), std::move(resource_group_ptr)); mysql_rwlock_unlock(&m_map_rwlock); return false; } void Resource_group_mgr::remove_resource_group(const std::string &name) { DBUG_TRACE; assert(m_resource_group_support); mysql_rwlock_wrlock(&m_map_rwlock); m_resource_group_hash->erase(name); mysql_rwlock_unlock(&m_map_rwlock); } Resource_group *Resource_group_mgr::create_and_add_in_resource_group_hash( const LEX_CSTRING &name, Type type, bool enabled, std::unique_ptr> vcpu_range_vector, int priority) { DBUG_TRACE; assert(m_resource_group_support); auto resource_group_ptr = new (std::nothrow) Resource_group(std::string(name.str), type, enabled); if (resource_group_ptr == nullptr) { my_error(ER_OUTOFMEMORY, MYF(ME_FATALERROR), 0); return nullptr; } auto thr_res_ctrl = resource_group_ptr->controller(); thr_res_ctrl->set_priority(priority); thr_res_ctrl->set_vcpu_vector(*vcpu_range_vector); // add to in-memory hash Resource_group_mgr::instance()->add_resource_group( std::unique_ptr(resource_group_ptr)); return resource_group_ptr; } #ifndef NDEBUG bool Resource_group_mgr::disable_pfs_notification() { if (!m_resource_group_support || m_notify_svc == nullptr) return false; m_notify_svc->unregister_notification(m_notify_handle); m_notify_handle = 0; return false; } #endif bool Resource_group_mgr::switch_resource_group_if_needed( THD *thd, resourcegroups::Resource_group **src_res_grp, resourcegroups::Resource_group **dest_res_grp, MDL_ticket **ticket, MDL_ticket **cur_ticket) { bool switched = false; auto res_grp_name = thd->resource_group_ctx()->m_switch_resource_group_str; if (!opt_initialize && res_grp_name[0] != '\0') { resourcegroups::Resource_group_mgr *mgr_instance = resourcegroups::Resource_group_mgr::instance(); if (mgr_instance->acquire_shared_mdl_for_resource_group( thd, res_grp_name, MDL_EXPLICIT, ticket, false)) { LogErr(WARNING_LEVEL, ER_FAILED_TO_ACQUIRE_LOCK_ON_RESOURCE_GROUP, res_grp_name); res_grp_name[0] = '\0'; return false; } auto resource_group = mgr_instance->get_resource_group(res_grp_name); if (resource_group == nullptr) { thd->resource_group_ctx()->m_warn = WARN_RESOURCE_GROUP_NOT_EXISTS; return false; } Security_context *sctx = thd->security_context(); if (!(sctx->has_global_grant(STRING_WITH_LEN("RESOURCE_GROUP_ADMIN")) .first || sctx->has_global_grant(STRING_WITH_LEN("RESOURCE_GROUP_USER")) .first)) { thd->resource_group_ctx()->m_warn = WARN_RESOURCE_GROUP_ACCESS_DENIED; } // Do not allow SYSTEM resource group to bind with a session thread. if (resource_group->type() == resourcegroups::Type::SYSTEM_RESOURCE_GROUP) { thd->resource_group_ctx()->m_warn = WARN_RESOURCE_GROUP_TYPE_MISMATCH; return false; } mysql_mutex_lock(&thd->LOCK_thd_data); *src_res_grp = thd->resource_group_ctx()->m_cur_resource_group; *dest_res_grp = resource_group; if (*src_res_grp == *dest_res_grp) { mysql_mutex_unlock(&thd->LOCK_thd_data); return false; } const char *src_res_grp_str = *src_res_grp != nullptr ? (*src_res_grp)->name().c_str() : nullptr; if (src_res_grp_str != nullptr && mgr_instance->acquire_shared_mdl_for_resource_group( thd, src_res_grp_str, MDL_EXPLICIT, cur_ticket, true)) { LogErr(WARNING_LEVEL, ER_FAILED_TO_ACQUIRE_LOCK_ON_RESOURCE_GROUP, src_res_grp_str); mysql_mutex_unlock(&thd->LOCK_thd_data); res_grp_name[0] = '\0'; return false; } assert(*dest_res_grp != nullptr); switched = mgr_instance->move_resource_group(*src_res_grp, *dest_res_grp); mysql_mutex_unlock(&thd->LOCK_thd_data); DBUG_EXECUTE_IF("pause_after_rg_switch", { const char act[] = "now SIGNAL execute_pfs_select " "WAIT_FOR signal_to_continue"; assert(!debug_sync_set_action(thd, STRING_WITH_LEN(act))); };); } return switched; } } // namespace resourcegroups