crowbar/crowbar-openstack
chef/cookbooks/mysql/recipes/ha_galera.rb

#
# Cookbook Name:: mysql
# Recipe:: ha_galera
#
# Copyright 2017, SUSE Linux GmbH.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

resource_agent = "ocf:heartbeat:galera"
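# (ocf:heartbeat:galera is a multi-state resource agent: nodes join as slaves
# and are promoted to master once they have synced with the cluster, so every
# healthy node ends up writable.)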

node[:mysql][:galera_packages].each do |p|
  package p
end

directory "/var/run/mysql/" do
  owner "mysql"
  group "root"
  mode "0755"
  action :create
end

directory "/var/lib/mysql/" do
  owner "mysql"
  group "root"
  mode "0700"
  action :create
end

node_address = Chef::Recipe::Barclamp::Inventory.get_network_by_type(node, "admin").address

# These retries are needed because a single-node bootstrap cluster can take a
# while to report "Synced". If that takes too long, the user creation below
# will fail.
early_sync_retry_delay = 10
early_sync_retries = 2
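# These retry values are added to the "sync-database_before_ha" timeout
# further down, so non-founder nodes wait at least as long as the founder
# may spend retrying here.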

unless node[:database][:galera_bootstrapped]
  if CrowbarPacemakerHelper.is_cluster_founder?(node)
    case node[:platform_family]
    when "rhel", "fedora"
      mysql_service_name = "mysqld"
    else
      mysql_service_name = "mysql"
    end

    # The service may still be running from a previous failed run. If it is, it
    # will hold various locks on files in /var/lib/mysql, which will cause
    # mysql_install_db to fail with a timeout.
    service "ensure mysql-temp is stopped" do
      service_name mysql_service_name
      supports status: true, restart: true, reload: true
      action :stop
      notifies :run, "execute[mysql_install_db]", :immediately
    end

    execute "mysql_install_db" do
      command "mysql_install_db"
      action :nothing
    end
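
    # mysql_install_db initializes a fresh data directory; with action :nothing
    # it only runs when notified by the stop above, i.e. only when a stale
    # server was actually running and had to be stopped.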

    # To bootstrap the cluster for the first time, start Galera on a single
    # node and set up the SST and monitoring users.

    template "temporary bootstrap /etc/my.cnf.d/75-galera.cnf" do
      path "/etc/my.cnf.d/75-galera.cnf"
      source "galera.cnf.erb"
      owner "root"
      group "mysql"
      mode "0640"
      variables(
        cluster_addresses: "gcomm://",
        sstuser: "root",
        sstuser_password: "",
        expire_logs_days: node[:database][:mysql][:expire_logs_days],
        node_address: node_address,
        wsrep_slave_threads: node[:database][:mysql][:wsrep_slave_threads],
        gcs_fc_limit_multiplier: node[:database][:mysql][:gcs_fc_limit_multiplier],
        gcs_fc_factor: node[:database][:mysql][:gcs_fc_factor],
        wsrep_provider_options_custom: node[:database][:mysql][:wsrep_provider_options_custom].join(";")
      )
    end
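
    # An empty "gcomm://" cluster address tells Galera to bootstrap a brand new
    # cluster instead of joining an existing one; the real member list is
    # written out further below once all cluster nodes are known.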

    # Use the initial root:'' credentials to set up the new user. The
    # unauthenticated root user is removed later, in server.rb, after the
    # bootstrapping. Once the cluster has started, the other nodes will pick up
    # the sstuser and we are able to use these credentials.
    db_settings = fetch_database_settings
    db_connection = db_settings[:connection].dup
    db_connection[:host] = "localhost"
    db_connection[:username] = "root"
    db_connection[:password] = ""
    db_connection[:ssl] = {}

    service "mysql-temp start" do
      service_name mysql_service_name
      supports status: true, restart: true, reload: true
      action :start
    end

    execute "Test WSREP state early" do
      retries early_sync_retries
      retry_delay early_sync_retry_delay
      command "mysql -u 'monitoring' -N -B " \
        "-e \"SHOW STATUS WHERE Variable_name='wsrep_local_state_comment';\" | grep Synced"
      action :run
    end
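
    # The grep makes this command fail (non-zero exit) until the node reports
    # "Synced", so the retries above effectively poll the WSREP state. The raw
    # query output looks roughly like (illustrative):
    #   wsrep_local_state_comment   Synced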

    database_user "create state snapshot transfer user" do
      connection db_connection
      username "sstuser"
      password node[:database][:mysql][:sstuser_password]
      host "localhost"
      provider db_settings[:user_provider]
      action :create
    end

    database_user "grant sstuser root privileges" do
      connection db_connection
      username "sstuser"
      password node[:database][:mysql][:sstuser_password]
      host "localhost"
      provider db_settings[:user_provider]
      action :grant
    end

    database_user "create haproxy and galera monitoring user" do
      connection db_connection
      username "monitoring"
      password ""
      host "%"
      provider db_settings[:user_provider]
      action :create
    end
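
    # At this point three accounts exist: the (still passwordless) root user,
    # "sstuser" for state snapshot transfers between nodes, and the
    # passwordless "monitoring" user that haproxy and clustercheck use for
    # health checks.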

    service "mysql-temp stop" do
      service_name mysql_service_name
      supports status: true, restart: true, reload: true
      action :stop
    end
  end
end

service_name = "galera"

cluster_nodes = CrowbarPacemakerHelper.cluster_nodes(node)
nodes_names = cluster_nodes.map { |n| n[:hostname] }

cluster_addresses = "gcomm://" + nodes_names.join(",")
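# e.g. with three cluster members (hypothetical hostnames) this yields:
#   "gcomm://node1,node2,node3"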

template "/etc/my.cnf.d/75-galera.cnf" do
  source "galera.cnf.erb"
  owner "root"
  group "mysql"
  mode "0640"
  variables(
    cluster_addresses: cluster_addresses,
    sstuser: "sstuser",
    sstuser_password: node[:database][:mysql][:sstuser_password],
    expire_logs_days: node[:database][:mysql][:expire_logs_days],
    node_address: node_address,
    wsrep_slave_threads: node[:database][:mysql][:wsrep_slave_threads],
    gcs_fc_limit_multiplier: node[:database][:mysql][:gcs_fc_limit_multiplier],
    gcs_fc_factor: node[:database][:mysql][:gcs_fc_factor],
    wsrep_provider_options_custom: node[:database][:mysql][:wsrep_provider_options_custom].join(";")
  )
end

file "/etc/my.cnf.d/galera.cnf" do
  action :delete
  notifies :restart, "service[mysql]"
end

# Configuration files for galera-python-clustercheck
template "/etc/galera-python-clustercheck/galera-python-clustercheck.conf" do
  source "galera-python-clustercheck.conf.erb"
  owner "galera-python-clustercheck"
  group "mysql"
  mode "0640"
  variables(
    node_address: node_address
  )
end

template "/etc/galera-python-clustercheck/my.cnf" do
  source "galera-python-clustercheck-my.cnf.erb"
  owner "galera-python-clustercheck"
  group "mysql"
  mode "0640"
  variables(
    node_address: node_address
  )
end

# Wait for all nodes to reach this point so we know that all nodes will have
# all the required packages and configurations installed before we create the
# pacemaker resources
crowbar_pacemaker_sync_mark "sync-database_before_ha" do
  timeout node[:database][:mysql][:presync_timeout] + (early_sync_retry_delay * early_sync_retries)
  revision node[:database]["crowbar-revision"]
end

transaction_objects = []

# Avoid races when creating pacemaker resources
crowbar_pacemaker_sync_mark "wait-database_ha_resources" do
  revision node[:database]["crowbar-revision"]
end

# Some of the op attributes are now in the proposal, so we need to merge the
# default attributes with the proposal attributes (which completely override
# the default attributes, even the ones not defined in the proposal).
primitive_op = node.default_attrs[:mysql][:ha][:op].to_hash
primitive_op.merge!(node[:database][:mysql][:ha][:op].to_hash)
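# Illustrative (hypothetical values): with default ops
#   { "monitor" => { "interval" => "20", "role" => "Master" } }
# and proposal ops
#   { "monitor" => { "interval" => "30" } }
# the shallow merge! keeps only the proposal's "monitor" hash, dropping the
# default "role" entry as well.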

pacemaker_primitive service_name do
  agent resource_agent
  params({
    "enable_creation" => true,
    "wsrep_cluster_address" => cluster_addresses,
    "check_user" => "monitoring",
    "check_passwd_use_empty" => 1,
    "socket" => "/var/run/mysql/mysql.sock",
    "datadir" => node[:database][:mysql][:datadir],
    "log" => "/var/log/mysql/mysqld.log"
  })
  op primitive_op
  action :update
  only_if { CrowbarPacemakerHelper.is_cluster_founder?(node) }
end

transaction_objects.push("pacemaker_primitive[#{service_name}]")

ms_name = "ms-#{service_name}"
pacemaker_ms ms_name do
  rsc service_name
  meta(
    "master-max" => nodes_names.size,
    "clone-max" => nodes_names.size,
    "ordered" => "false",
    "interleave" => "false",
    "notify" => "true"
  )
  action :update
  only_if { CrowbarPacemakerHelper.is_cluster_founder?(node) }
end
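
# master-max equal to the cluster size lets pacemaker promote every node to
# master once it is synced, giving the usual Galera multi-master setup.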

transaction_objects.push("pacemaker_ms[#{ms_name}]")

ms_location_name = openstack_pacemaker_controller_location_ignoring_upgrade_for ms_name
transaction_objects << "pacemaker_location[#{ms_location_name}]"

pacemaker_transaction "galera service" do
  cib_objects transaction_objects
  # note that this will also automatically start the resources
  action :commit_new
  only_if { CrowbarPacemakerHelper.is_cluster_founder?(node) }
end

crowbar_pacemaker_sync_mark "create-database_ha_resources" do
  revision node[:database]["crowbar-revision"]
end

# The pacemaker galera resource agent will now bootstrap the cluster, which
# might take a while. Wait for that to complete by watching the
# "wsrep_local_state_comment" status variable on all cluster nodes until it
# reaches the "Synced" state, before continuing with the rest of the recipe.
ruby_block "wait galera bootstrap" do
  seconds = node[:database][:mysql][:bootstrap_timeout]
  block do
    require "timeout"
    begin
      cmd = "mysql -u 'monitoring' -N -B " \
        "-e \"SHOW STATUS WHERE Variable_name='wsrep_local_state_comment';\" | cut -f 2"
      sync_state = ""
      Timeout.timeout(seconds) do
        while sync_state != "Synced"
          sleep(1)
          get_state = Mixlib::ShellOut.new(cmd).run_command
          sync_state = get_state.stdout.chop
        end
      end
    rescue Timeout::Error
      message = "Galera cluster did not start after #{seconds} seconds. " \
        "Check pacemaker and mysql log files manually for possible errors."
      Chef::Log.fatal(message)
      raise message
    end
  end
  not_if { node[:database][:galera_bootstrapped] }
end

ruby_block "mark node for galera bootstrap" do
  block do
    node.set[:database][:galera_bootstrapped] = true
    node.save
  end
  not_if { node[:database][:galera_bootstrapped] }
end

crowbar_pacemaker_sync_mark "sync-database_boostrapped" do
  # to be on the safe side we need to wait at least as long as the other nodes might
  # need for bootstrapping (see the 'ruby_block "wait galera bootstrap"' above)
  timeout node[:database][:mysql][:bootstrap_timeout] + 10
  revision node[:database]["crowbar-revision"]
end

execute "assign-root-password-galera" do
  command "/usr/bin/mysqladmin -u root \
    password \"#{node[:database][:mysql][:server_root_password]}\""
  action :run
  only_if { CrowbarPacemakerHelper.is_cluster_founder?(node) }
  only_if "/usr/bin/mysql --no-defaults -u root -e 'select (1);'"
end
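
# The second guard only succeeds while root can still log in without a
# password, so the password is set exactly once and the command stays
# idempotent across chef runs.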

crowbar_pacemaker_sync_mark "sync-database_root_password" do
  revision node[:database]["crowbar-revision"]
end

# Start galera-python-clustercheck, which serves the cluster state as HTTP
# return codes on port 5555.
transaction_objects = []
service_name = "galera-python-clustercheck"

clustercheck_op = { "monitor" => { "interval" => "10s" } }

pacemaker_primitive service_name do
  agent "systemd:#{service_name}"
  op clustercheck_op
  action :update
  only_if { CrowbarPacemakerHelper.is_cluster_founder?(node) }
end

transaction_objects.push("pacemaker_primitive[#{service_name}]")

clone_name = "cl-#{service_name}"
pacemaker_clone clone_name do
  rsc service_name
  meta CrowbarPacemakerHelper.clone_meta(node, remote: false)
  action :update
  only_if { CrowbarPacemakerHelper.is_cluster_founder?(node) }
end

transaction_objects.push("pacemaker_clone[#{clone_name}]")

clone_location_name = openstack_pacemaker_controller_location_ignoring_upgrade_for clone_name
transaction_objects << "pacemaker_location[#{clone_location_name}]"

pacemaker_transaction "clustercheck" do
  cib_objects transaction_objects
  action :commit_new
  only_if { CrowbarPacemakerHelper.is_cluster_founder?(node) }
end

include_recipe "crowbar-pacemaker::haproxy"

ha_servers = CrowbarPacemakerHelper.haproxy_servers_for_service(
  node, "mysql", "database-server", "admin_port"
)

# Let all nodes but one act as backup (standby) servers. A backup server is
# only used when the non-backup one is down; this prevents possible deadlocks
# caused by OpenStack services writing to the database on different nodes at
# once.
ha_servers.each do |n|
  # Let the current node be the non-backup one, so haproxy running on this
  # node does not direct traffic elsewhere by default.
  n["backup"] = n["name"] != node["hostname"]
  # lower the number of unsuccessful checks needed for declaring server DOWN
  n["fall"] = 2
  # lower the interval checking after first failure is found
  n["fastinter"] = 1000
  # shutdown connection when backend is marked down
  n["on_marked_down_shutdown"] = true
end
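
# With these settings every haproxy backend line except the local node's is
# rendered with "backup", roughly like (hypothetical name/address):
#   server node2 192.168.124.82:3306 backup fall 2 fastinter 1000 ...
# The exact output depends on the haproxy_loadbalancer provider's template.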

haproxy_loadbalancer "galera" do
  address CrowbarPacemakerHelper.cluster_vip(node, "admin")
  port 3306
  mode "tcp"
  # leave some room for pacemaker health checks
  max_connections node[:database][:mysql][:max_connections] - 10
  options ["httpchk", "clitcpka"]
  default_server "port 5555"
  stick("on" => "dst")
  servers ha_servers
  action :nothing
end.run_action(:create)
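
# "action :nothing" plus "run_action(:create)" forces this resource to run at
# compile time (while the recipe is being evaluated) instead of during the
# normal converge phase.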