Skip to content

Instantly share code, notes, and snippets.

@whitehat101
Created November 22, 2016 06:18
Show Gist options
  • Save whitehat101/19efdb92e106a276a60ec5eb0565f14c to your computer and use it in GitHub Desktop.
Save whitehat101/19efdb92e106a276a60ec5eb0565f14c to your computer and use it in GitHub Desktop.
God configuration with CPU & memory monitoring and email notifications
# Thanks: https://github.com/dotgee/geoauth/blob/78e859b2d4ca5cd5788aeb3c3a64f2ccc92202dc/config/puma.god
ROOT = "/var/www/app/rails/development/geoauth"
God.pid_file_directory = "#{ROOT}/tmp/pids"
# rails_env = ENV['RAILS_ENV'] || 'production'
rails_env = ENV['RAILS_ENV'] || 'development'
rails_root = ENV['RAILS_ROOT'] || ROOT
God::Contacts::Email.defaults do |d|
d.from_email = '[email protected]'
d.from_name = 'God Watcher'
d.delivery_method = :sendmail
end
God.contact(:email) do |c|
c.name = 'xymox'
c.group = 'admins'
c.to_email = '[email protected]'
end
God.watch do |w|
w.name = "puma"
w.interval = 10.seconds # default
# unicorn needs to be run from the rails root
w.start = "cd #{rails_root} && bundle exec puma -b unix://#{rails_root}/tmp/sockets/puma.sock -q --pidfile #{rails_root}/tmp/pids/puma.pid"
# QUIT gracefully shuts down workers
w.stop = "kill -TERM `cat #{rails_root}/tmp/pids/puma.pid`"
# USR2 causes the master to re-create itself and spawn a new worker pool
w.restart = "kill -USR2 `cat #{rails_root}/tmp/pids/puma.pid`"
w.start_grace = 10.seconds
w.restart_grace = 10.seconds
w.pid_file = "#{rails_root}/tmp/pids/puma.pid"
#w.uid = 'xymox'
#w.gid = 'rvm'
w.behavior(:clean_pid_file)
w.start_if do |start|
start.condition(:process_running) do |c|
c.interval = 5.seconds
c.running = false
end
end
w.restart_if do |restart|
restart.condition(:memory_usage) do |c|
c.above = 100.megabytes
c.times = [3, 5] # 3 out of 5 intervals
end
restart.condition(:cpu_usage) do |c|
c.above = 50.percent
c.times = 5
end
end
# lifecycle
w.lifecycle do |on|
on.condition(:flapping) do |c|
c.to_state = [:start, :restart]
c.times = 5
c.within = 5.minute
c.transition = :unmonitored
c.retry_in = 10.minutes
c.retry_times = 5
c.retry_within = 2.hours
end
end
end
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment