2013-12-12 01:33:01 +00:00

377 lines
13 KiB
Ruby

#
# Cookbook Name:: postgresql
# Library:: default
# Author:: David Crane (<davidc@donorschoose.org>)
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
include Chef::Mixin::ShellOut
module Opscode
module PostgresqlHelpers
#######
# Function to truncate value to 4 significant bits, render human readable.
# Used in recipes/config_initdb.rb to set this attribute:
#
# The memory settings (shared_buffers, effective_cache_size, work_mem,
# maintenance_work_mem and wal_buffers) will be rounded down to keep
# the 4 most significant bits, so that SHOW will be likely to use a
# larger divisor. The output is actually a human readable string that
# ends with "GB", "MB" or "kB" if over 1023, exactly what Postgresql
# will expect in a postgresql.conf setting. The output may be up to
# 6.25% less than the original value because of the rounding.
def binaryround(value)
# Keep a multiplier which grows through powers of 1
multiplier = 1
# Truncate value to 4 most significant bits
while value >= 16
value = (value / 2).floor
multiplier = multiplier * 2
end
# Factor any remaining powers of 2 into the multiplier
while value == 2*((value / 2).floor)
value = (value / 2).floor
multiplier = multiplier * 2
end
# Factor enough powers of 2 back into the value to
# leave the multiplier as a power of 1024 that can
# be represented as units of "GB", "MB" or "kB".
if multiplier >= 1024*1024*1024
while multiplier > 1024*1024*1024
value = 2*value
multiplier = (multiplier/2).floor
end
multiplier = 1
units = "GB"
elsif multiplier >= 1024*1024
while multiplier > 1024*1024
value = 2*value
multiplier = (multiplier/2).floor
end
multiplier = 1
units = "MB"
elsif multiplier >= 1024
while multiplier > 1024
value = 2*value
multiplier = (multiplier/2).floor
end
multiplier = 1
units = "kB"
else
units = ""
end
# Now we can return a nice human readable string.
return "#{multiplier * value}#{units}"
end
#######
# Locale Configuration
# Function to test the date order.
# Used in recipes/config_initdb.rb to set this attribute:
# node.default['postgresql']['config']['datestyle']
def locale_date_order
# Test locale conversion of mon=11, day=22, year=33
testtime = DateTime.new(2033,11,22,0,0,0,"-00:00")
#=> #<DateTime: 2033-11-22T00:00:00-0000 ...>
# %x - Preferred representation for the date alone, no time
res = testtime.strftime("%x")
if res.nil?
return 'mdy'
end
posM = res.index("11")
posD = res.index("22")
posY = res.index("33")
if (posM.nil? || posD.nil? || posY.nil?)
return 'mdy'
elseif (posY < posM && posM < posD)
return 'ymd'
elseif (posD < posM)
return 'dmy'
else
return 'mdy'
end
end
#######
# Timezone Configuration
require 'find'
# Function to determine where the system stored shared timezone data.
# Used in recipes/config_initdb.rb to detemine where it should have
# select_default_timezone(tzdir) search.
def pg_TZDIR()
# System time zone conversions are controlled by a timezone data file
# identified through environment variables (TZ and TZDIR) and/or file
# and directory naming conventions specific to the Linux distribution.
# Each of these timezone names will have been loaded into the PostgreSQL
# pg_timezone_names view by the package maintainer.
#
# Instead of using the timezone name configured as the system default,
# the PostgreSQL server uses ones named in postgresql.conf settings
# (timezone and log_timezone). The initdb utility does initialize those
# settings to the timezone name that corresponds to the system default.
#
# The system's timezone name is actually a filename relative to the
# shared zoneinfo directory. That is usually /usr/share/zoneinfo, but
# it was /usr/lib/zoneinfo in older distributions and can be anywhere
# if specified by the environment variable TZDIR. The tzset(3) manpage
# seems to indicate the following precedence:
tzdir = nil
if ::File.directory?("/usr/lib/zoneinfo")
tzdir = "/usr/lib/zoneinfo"
else
share_path = [ ENV['TZDIR'], "/usr/share/zoneinfo" ].compact.first
if ::File.directory?(share_path)
tzdir = share_path
end
end
return tzdir
end
#######
# Function to support select_default_timezone(tzdir), which is
# used in recipes/config_initdb.rb.
def validate_zone(tzname)
# PostgreSQL does not support leap seconds, so this function tests
# the usual Linux tzname convention to avoid a misconfiguration.
# Assume that the tzdata package maintainer has kept all timezone
# data files with support for leap seconds is kept under the
# so-named "right/" subdir of the shared zoneinfo directory.
#
# The original PostgreSQL initdb is not Unix-specific, so it did a
# very complicated, thorough test in its pg_tz_acceptable() function
# that I could not begin to understand how to do in ruby :).
#
# Testing the tzname is good enough, since a misconfiguration
# will result in an immediate fatal error when the PostgreSQL
# service is started, with pgstartup.log messages such as:
# LOG: time zone "right/US/Eastern" appears to use leap seconds
# DETAIL: PostgreSQL does not support leap seconds.
if tzname.index("right/") == 0
return false
else
return true
end
end
# Function to support select_default_timezone(tzdir), which is
# used in recipes/config_initdb.rb.
def scan_available_timezones(tzdir)
# There should be an /etc/localtime zoneinfo file that is a link to
# (or a copy of) a timezone data file under tzdir, which should have
# been installed under the "share" directory by the tzdata package.
#
# The initdb utility determines which shared timezone file is being
# used as the system's default /etc/localtime. The timezone name is
# the timezone file path relative to the tzdir.
bestzonename = nil
if (tzdir.nil?)
Chef::Log.error("The zoneinfo directory not found (looked for /usr/share/zoneinfo and /usr/lib/zoneinfo)")
elsif !::File.exists?("/etc/localtime")
Chef::Log.error("The system zoneinfo file not found (looked for /etc/localtime)")
elsif ::File.directory?("/etc/localtime")
Chef::Log.error("The system zoneinfo file not found (/etc/localtime is a directory instead)")
elsif ::File.symlink?("/etc/localtime")
# PostgreSQL initdb doesn't use the symlink target, but this
# certainly will make sense to any system administrator. A full
# scan of the tzdir to find the shortest filename could result
# "US/Eastern" instead of "America/New_York" as bestzonename,
# in spite of what the sysadmin had specified in the symlink.
# (There are many duplicates under tzdir, with the same timezone
# content appearing as an average of 2-3 different file names.)
path = ::File.readlink("/etc/localtime")
bestzonename = path.gsub("#{tzdir}/","")
else # /etc/localtime is a file, so scan for it under tzdir
localtime_content = File.read("/etc/localtime")
Find.find(tzdir) do |path|
# Only consider files (skip directories or symlinks)
if !::File.directory?(path) && !::File.symlink?(path)
# Ignore any file named "posixrules" or "localtime"
if ::File.basename(path) != "posixrules" && ::File.basename(path) != "localtime"
# Do consider if content exactly matches /etc/localtime.
if localtime_content == File.read(path)
tzname = path.gsub("#{tzdir}/","")
if validate_zone(tzname)
if (bestzonename.nil? ||
tzname.length < bestzonename.length ||
(tzname.length == bestzonename.length &&
(tzname <=> bestzonename) < 0)
)
bestzonename = tzname
end
end
end
end
end
end
end
return bestzonename
end
# Function to support select_default_timezone(tzdir), which is
# used in recipes/config_initdb.rb.
def identify_system_timezone(tzdir)
resultbuf = scan_available_timezones(tzdir)
if !resultbuf.nil?
# Ignore Olson's rather silly "Factory" zone; use GMT instead
if (resultbuf <=> "Factory") == 0
resultbuf = nil
end
else
# Did not find the timezone. Fallback to use a GMT zone. Note that the
# Olson timezone database names the GMT-offset zones in POSIX style: plus
# is west of Greenwich.
testtime = DateTime.now
std_ofs = testtime.strftime("%:z").split(":")[0].to_i
resultbuf = [
"Etc/GMT",
(-std_ofs > 0) ? "+" : "",
(-std_ofs).to_s
].join('')
end
return resultbuf
end
#######
# Function to determine the name of the system's default timezone.
# Used in recipes/config_initdb.rb to set these attributes:
# node.default['postgresql']['config']['log_timezone']
# node.default['postgresql']['config']['timezone']
def select_default_timezone(tzdir)
system_timezone = nil
# Check TZ environment variable
tzname = ENV['TZ']
if !tzname.nil? && !tzname.empty? && validate_zone(tzname)
system_timezone = tzname
else
# Nope, so try to identify system timezone from /etc/localtime
tzname = identify_system_timezone(tzdir)
if validate_zone(tzname)
system_timezone = tzname
end
end
return system_timezone
end
#######
# Function to determine the name of the system's default timezone.
def get_result_orig(query)
# query could be a String or an Array of String
if (query.is_a?(String))
stdin = query
else
stdin = query.join("\n")
end
@get_result ||= begin
cmd = shell_out("cat", :input => stdin)
cmd.stdout
end
end
#######
# Function to execute an SQL statement in the template1 database.
# Input: Query could be a single String or an Array of String.
# Output: A String with |-separated columns and \n-separated rows.
# Note an empty output could mean psql couldn't connect.
# This is easiest for 1-field (1-row, 1-col) results, otherwise
# it will be complex to parse the results.
def execute_sql(query)
# query could be a String or an Array of String
statement = query.is_a?(String) ? query : query.join("\n")
@execute_sql ||= begin
cmd = shell_out("psql -q --tuples-only --no-align -d template1 -f -",
:user => "postgres",
:input => statement
)
# If psql fails, generally the postgresql service is down.
# Instead of aborting chef with a fatal error, let's just
# pass these non-zero exitstatus back as empty cmd.stdout.
if (cmd.exitstatus() == 0 and !cmd.stderr.empty?)
# An SQL failure is still a zero exitstatus, but then the
# stderr explains the error, so let's rais that as fatal.
Chef::Log.fatal("psql failed executing this SQL statement:\n#{statement}")
Chef::Log.fatal(cmd.stderr)
raise "SQL ERROR"
end
cmd.stdout.chomp
end
end
#######
# Function to determine if a standard contrib extension is already installed.
# Input: Extension name
# Output: true or false
# Best use as a not_if gate on bash "install-#{pg_ext}-extension" resource.
def extension_installed?(pg_ext)
@extension_installed ||= begin
installed=execute_sql("select 'installed' from pg_extension where extname = '#{pg_ext}';")
installed =~ /^installed$/
end
end
######################################
# Function to build information needed to install RPM for PGDG yum repository,
# since PGDG supports several versions of PostgreSQL, platforms, platform versions
# and architectures.
# Links to RPMs for installation are in an attribute so that new versions/platforms
# can be more easily added. (See attributes/default.rb)
def pgdgrepo_rpm_info
repo_rpm_url = node['postgresql']['pgdg']['repo_rpm_url'].
fetch(node['postgresql']['version']). # e.g., fetch for "9.1"
fetch(node['platform']). # e.g., fetch for "centos"
fetch(node['platform_version'].to_f.to_i.to_s). # e.g., fetch for "5" (truncated "5.7")
fetch(node['kernel']['machine']) # e.g., fetch for "i386" or "x86_64"
# Extract the filename portion from the URL for the PGDG repository RPM.
# E.g., repo_rpm_filename = "pgdg-centos92-9.2-6.noarch.rpm"
repo_rpm_filename = File.basename(repo_rpm_url)
# Extract the package name from the URL for the PGDG repository RPM.
# E.g., repo_rpm_package = "pgdg-centos92"
repo_rpm_package = repo_rpm_filename.split(/-/,3)[0..1].join('-')
return [ repo_rpm_url, repo_rpm_filename, repo_rpm_package ]
end
# End the Opscode::PostgresqlHelpers module
end
end