Files
neocities/workers/lets_encrypt_worker.rb
T
2026-05-12 15:29:46 -05:00

307 lines
9.7 KiB
Ruby

require 'digest'
class LetsEncryptWorker
# Raised by #perform when an ACME HTTP challenge has reported neither 'valid'
# nor 'invalid' after the polling limit.
class VerificationTimeoutError < StandardError; end
# Raised by #perform when the ACME order is still 'processing' after the
# polling limit that follows finalization.
class FinalizeTimeoutError < StandardError; end
include Sidekiq::Worker
# Dedicated queue for certificate jobs; retry is capped at 10 and backtraces are kept.
sidekiq_options queue: :lets_encrypt_worker, retry: 10, backtrace: true
# A stored certificate that expires within this window is no longer treated
# as active (see #active_certificate_covers?).
CERT_RENEWAL_WINDOW = 30.days
# Prefix of the Redis keys that record an ACME rate limit for a set of domains.
ACME_RATE_LIMIT_KEY_PREFIX = 'lets_encrypt_worker:rate_limited'
# Upper bound of the random extra delay added when a rate-limited job is rescheduled.
ACME_RATE_LIMIT_RETRY_JITTER = 30.minutes
# Retry delay requested from Sidekiq, in seconds: 5 minutes times the retry count.
sidekiq_retry_in do |count|
5.minutes.to_i * count
end
# If you need to clear scheduled jobs:
# Sidekiq::ScheduledSet.new.select {|s| JSON.parse(s.value)['class'] == 'LetsEncryptWorker'}.each {|j| j.delete}
# ACME directory endpoints. #letsencrypt uses DIRECTORY when RACK_ENV is
# 'production' and STAGING_DIRECTORY otherwise.
DIRECTORY = 'https://acme-v02.api.letsencrypt.org/directory'
STAGING_DIRECTORY = 'https://acme-staging-v02.api.letsencrypt.org/directory'
# Builds a new ACME client on every call.
#
# The account key is read from the file named by $config['letsencrypt_key'].
# The production directory is used only when RACK_ENV is 'production'; any
# other environment talks to the staging directory.
#
# @return [Acme::Client]
def letsencrypt
  account_key = OpenSSL::PKey::RSA.new(File.read($config['letsencrypt_key']))
  acme_directory = ENV['RACK_ENV'] == 'production' ? DIRECTORY : STAGING_DIRECTORY

  Acme::Client.new(private_key: account_key, directory: acme_directory)
end
# Sidekiq entry point: obtains (or renews) the Let's Encrypt certificate for
# the custom domain of one site.
#
# Steps, in order:
# 1. Deletes other queued jobs that carry the same site id.
# 2. Writes a random test file under .well-known/acme-challenge and fetches it
#    over HTTP from the bare domain and from its www. variant; only domains
#    that serve the file back unchanged count as verified.
# 3. When verification fails, increments site.domain_fail_count and
#    reschedules itself, or, once the counter has reached 60, removes the
#    domain from the site and emails the owner.
# 4. Stops early when the stored certificate already covers the verified
#    domains, or when a recorded ACME rate limit is still in effect.
# 5. Otherwise places an ACME order, answers the HTTP challenges, finalizes
#    the order and stores the key and certificate on the site.
#
# @param site_id id of the site, looked up with Site[]
# @return [nil]
# @raise [VerificationTimeoutError] when a challenge is still undecided after
#   60 polls
# @raise [FinalizeTimeoutError] when the order is still 'processing' after
#   the finalize polling limit
def perform(site_id)
  # Dispose of dupes
  queue = Sidekiq::Queue.new self.class.sidekiq_options_hash['queue']
  queue.each do |job|
    if job.args == [site_id] && job.jid != jid
      job.delete
    end
  end

  site = Site[site_id]
  # The site row may no longer exist when the job finally runs. Bail out
  # instead of raising NoMethodError and burning every Sidekiq retry.
  return if site.nil?
  return if site.domain.blank? || site.is_deleted
  return if site.values[:domain].match(/\.neocities\.org$/i)

  domain_raw = site.values[:domain].gsub(/^www\./, '')
  domains = [domain_raw, "www.#{domain_raw}"]
  verified_domains = []

  domains.each do |domain|
    puts "verifying accessability of test file on #{domain}"
    challenge_base_path = File.join '.well-known', 'acme-challenge'
    testfile_name, testfile_key = "test#{SecureRandom.uuid}", SecureRandom.hex
    testfile_fs_path = File.join site.base_files_path, challenge_base_path

    begin
      FileUtils.mkdir_p testfile_fs_path
      File.write File.join(testfile_fs_path, testfile_name), testfile_key
    rescue => e
      puts "ERROR WRITING TO WELLKNOWN FILE, FAILING ON THIS SITE: #{site.username} #{domain}: #{e.inspect}"
      return
    end

    # Ensure that both domains work before sending request. Let's Encrypt has a low
    # pending request limit, and it takes one week (!) to flush out.
    challenge_url = "http://#{domain}/#{challenge_base_path}/#{testfile_name}"
    puts "testing #{challenge_url}"

    begin
      # Some dumb letsencrypt related cert expiration issue hotfix
      ctx = OpenSSL::SSL::SSLContext.new
      ctx.verify_mode = OpenSSL::SSL::VERIFY_NONE
      res = HTTP.timeout(connect: 10, write: 10, read: 10).follow.get(challenge_url, ssl_context: ctx)
    rescue => e
      puts e.inspect
      puts "error with #{challenge_url}"
      next
    end

    if res.body.to_s == testfile_key
      puts "match: #{challenge_url}"
      verified_domains << domain
    else
      puts "CONTENT DOWNLOADED DID NOT MATCH #{challenge_url}"
      next
    end
  end

  # Sites created in 2017 or later must verify the bare domain itself; older
  # sites pass with any verified domain.
  if verified_domains.empty? || (site.created_at.year >= 2017 && !verified_domains.include?(domain_raw))
    puts "no verified domains, skipping cert setup, reporting invalid domain"

    # This is a bit of an inappropriate shared responsibility,
    # but since were here, it looks like the domain is dead, so let's
    # try again a few times, but then pull the domain out of our system
    # if it looks like it's gone completely.
    if site.domain_fail_count < 60
      site.domain_fail_count += 1
      site.save_changes validate: false
    else
      old_domain = site.domain
      site.domain = nil
      site.domain_fail_count = 0
      site.save validate: false
      site.send_email(
        subject: "[Neocities] Your domain has stopped working",
        body: Tilt.new('./views/templates/email/domain_fail.erb', pretty: true).render(self, site: site, domain: old_domain)
      )
    end

    clean_wellknown_turds site

    # The counter is 0 only right after the domain was removed, so no retry
    # is scheduled in that case.
    if site.domain_fail_count > 0
      LetsEncryptWorker.perform_in((5.minutes * site.domain_fail_count), site.id)
    end

    return
  end

  if active_certificate_covers?(site, verified_domains)
    puts "existing certificate covers #{verified_domains.join(', ')}, skipping cert setup"
    if site.domain_fail_count.to_i > 0
      site.domain_fail_count = 0
      site.save_changes validate: false
    end
    clean_wellknown_turds site
    return
  end

  if (retry_at = acme_rate_limited_until(verified_domains))
    puts "ACME order for #{verified_domains.join(', ')} rate limited until #{retry_at.utc}"
    schedule_acme_rate_limited_retry site, verified_domains, retry_at
    clean_wellknown_turds site
    return
  end

  finalized_domains = []

  begin
    order = letsencrypt.new_order identifiers: verified_domains

    order.authorizations.each do |authorization|
      challenge = authorization.http

      if challenge.nil?
        puts "challenge object is nil, going to next domain"
        next
      end

      begin
        FileUtils.mkdir_p File.join(site.base_files_path, File.dirname(challenge.filename))
        File.write File.join(site.base_files_path, challenge.filename), challenge.file_content
      rescue StandardError
        puts "FAILED TO WRITE CHALLENGE: #{site.domain} #{challenge.filename}"
        # A verification needs to be attempted anyways, otherwise 300 of them will jam up the system for a week
      end

      challenge.request_validation

      sleep 1
      attempts = 0

      # Poll the challenge until the server reports a final status.
      while true
        result = challenge.status
        puts "#{authorization.domain} : #{result}"

        if result == 'valid'
          puts "VALIDATED: #{authorization.domain}"
          clean_wellknown_turds site
          finalized_domains.push authorization.domain
          break
        end

        raise VerificationTimeoutError if attempts == 60

        if result == 'invalid'
          puts "returned invalid (#{authorization.domain}, walking away"
          clean_wellknown_turds site
          break
        end

        attempts += 1
        challenge.reload
        sleep 2
      end
    end

    clean_wellknown_turds site

    csr = Acme::Client::CertificateRequest.new names: finalized_domains
    order.finalize csr: csr

    attempts = 0
    while order.status == 'processing'
      raise FinalizeTimeoutError if attempts > 60
      attempts += 1
      sleep 1
      # The order object caches the last server response. Without a reload
      # the status can never leave 'processing' and the loop would always
      # end in FinalizeTimeoutError.
      order.reload
    end

    site.ssl_key = csr.private_key.to_pem
    site.ssl_cert = order.certificate
    site.cert_updated_at = Time.now
    site.domain_fail_count = 0
    site.save_changes validate: false
  rescue Acme::Client::Error::RateLimited => e
    puts "ACME order for #{verified_domains.join(', ')} rate limited: #{e.message}"
    schedule_acme_rate_limited_retry site, verified_domains, e.retry_after_time
    clean_wellknown_turds site
    return
  end

  # Refresh the cert periodically, current expire time is 90 days
  # We're going for a cron task for this now, so this is commented out.
  #LetsEncryptWorker.perform_in 60.days, site.id
end
# Removes ACME challenge leftovers for a site, both in the database and on disk.
#
# Destroys every site file record whose path starts with
# '.well-known/acme-challenge', deletes the non-hidden entries of the
# acme-challenge directory and then the directory itself. The parent
# .well-known directory is removed as well, but only when the site has no
# record for it and it is empty.
#
# @param site object responding to base_files_path and site_files_dataset
def clean_wellknown_turds(site)
  wellknown_path = File.join(site.base_files_path, '.well-known')
  acme_challenge_path = File.join(wellknown_path, 'acme-challenge')

  challenge_records = site.site_files_dataset.where(Sequel.like(:path, '.well-known/acme-challenge%'))
  challenge_records.each { |record| record.destroy }

  leftovers = Dir.glob(File.join(acme_challenge_path, '*'))
  leftovers.each { |leftover| FileUtils.rm leftover }

  Dir.rmdir(acme_challenge_path) if Dir.exist?(acme_challenge_path)

  # .well-known was not created by user, removing to prevent confusion
  return unless site.site_files_dataset.where(path: '.well-known').count == 0

  begin
    Dir.rmdir wellknown_path
  rescue Errno::ENOTEMPTY, Errno::ENOENT
    # Other content lives there, or it never existed: leave things alone.
  end
end
# Tells whether the certificate stored on the site can keep serving the given
# domains, so that no new ACME order is needed.
#
# The answer is false when the site has no certificate, when the stored PEM
# cannot be parsed, or when the certificate expires within
# CERT_RENEWAL_WINDOW from now. Otherwise every domain must match at least one
# name on the certificate.
#
# @param site object responding to ssl_cert
# @param domains [Array<String>]
# @return [Boolean]
def active_certificate_covers?(site, domains)
  return false if site.ssl_cert.blank?

  certificate = OpenSSL::X509::Certificate.new(site.ssl_cert)
  renewal_deadline = Time.now + CERT_RENEWAL_WINDOW
  return false if certificate.not_after <= renewal_deadline

  covered = lambda do |domain|
    certificate_names(certificate).any? { |name| certificate_name_matches_domain?(name, domain) }
  end
  domains.all?(&covered)
rescue OpenSSL::X509::CertificateError
  false
end
# Lists the host names a certificate was issued for.
#
# Collects the DNS entries of every subjectAltName extension (other entry
# types are ignored) and appends the subject's CN when there is one. Names are
# lower-cased and de-duplicated, SAN entries first.
#
# @param certificate object responding to extensions and subject, such as an
#   OpenSSL::X509::Certificate
# @return [Array<String>]
def certificate_names(certificate)
  san_extensions = certificate.extensions.select { |ext| ext.oid == 'subjectAltName' }

  found = san_extensions.flat_map do |ext|
    entries = ext.value.split(',')
    # Each entry reads like "DNS:example.com"; anything else yields nil.
    entries.map { |entry| entry.strip[/\ADNS:(.+)\z/, 1] }.compact
  end

  cn_entry = certificate.subject.to_a.find { |field, _value, _type| field == 'CN' }
  found << cn_entry[1] if cn_entry

  found.map(&:downcase).uniq
end
# Case-insensitive check of a single certificate name against a domain.
#
# An exact match always counts. A name starting with '*.' matches a domain
# that ends with the rest of the name and has the same number of dots, so
# the wildcard stands for exactly one label.
#
# @param certificate_name [String] e.g. 'example.com' or '*.example.com'
# @param domain [String]
# @return [Boolean]
def certificate_name_matches_domain?(certificate_name, domain)
  pattern = certificate_name.downcase
  host = domain.downcase

  if pattern == host
    true
  elsif pattern.start_with?('*.')
    # Drop only the '*', keeping the leading dot as part of the suffix.
    wildcard_suffix = pattern[1..]
    host.end_with?(wildcard_suffix) && host.count('.') == pattern.count('.')
  else
    false
  end
end
# Looks up a recorded ACME rate limit for this set of domains.
#
# The Redis value is read as a float epoch timestamp; a missing key reads as 0.
#
# @param domains [Array<String>]
# @return [Time, nil] the time the limit lifts, or nil when nothing is
#   recorded or the recorded time is not in the future
def acme_rate_limited_until(domains)
  stored = $redis.get(acme_rate_limit_key(domains))
  lifts_at = stored.to_f

  lifts_at > Time.now.to_f ? Time.at(lifts_at) : nil
end
# Records an ACME rate limit for a set of domains and queues one retry.
#
# The retry is delayed until retry_at (at least 60 seconds from now) plus a
# random jitter below ACME_RATE_LIMIT_RETRY_JITTER. The Redis key is written
# with nx, so when a key for these domains already exists nothing is written
# and no job is queued. The key expires one hour after the computed delay.
#
# @param site object responding to id
# @param domains [Array<String>]
# @param retry_at [Time, nil] when the limit lifts; defaults to 10 minutes
#   from now
def schedule_acme_rate_limited_retry(site, domains, retry_at)
  retry_at = Time.now + 10.minutes unless retry_at

  wait_seconds = (retry_at - Time.now).ceil
  wait_seconds = 60 if wait_seconds < 60
  wait_seconds += rand(ACME_RATE_LIMIT_RETRY_JITTER.to_i)

  claimed = $redis.set(
    acme_rate_limit_key(domains),
    retry_at.to_f,
    nx: true,
    ex: wait_seconds + 1.hour.to_i
  )

  LetsEncryptWorker.perform_in(wait_seconds, site.id) if claimed
end
# Builds the Redis key under which a rate limit for these domains is stored.
#
# The domains are lower-cased and sorted before hashing, so order and letter
# case do not change the key.
#
# @param domains [Array<String>]
# @return [String] ACME_RATE_LIMIT_KEY_PREFIX, a colon, and a SHA-256 hex digest
def acme_rate_limit_key(domains)
  canonical = domains.map(&:downcase).sort.join(',')

  [ACME_RATE_LIMIT_KEY_PREFIX, Digest::SHA256.hexdigest(canonical)].join(':')
end
end