Платформа ЦРНП "Мирокод" для разработки проектов
https://git.mirocod.ru
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
573 lines
20 KiB
573 lines
20 KiB
// Copyright 2015 Matthew Holt |
|
// |
|
// Licensed under the Apache License, Version 2.0 (the "License"); |
|
// you may not use this file except in compliance with the License. |
|
// You may obtain a copy of the License at |
|
// |
|
// http://www.apache.org/licenses/LICENSE-2.0 |
|
// |
|
// Unless required by applicable law or agreed to in writing, software |
|
// distributed under the License is distributed on an "AS IS" BASIS, |
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
|
// See the License for the specific language governing permissions and |
|
// limitations under the License. |
|
|
|
package certmagic |
|
|
|
import ( |
|
"context" |
|
"crypto/tls" |
|
"encoding/json" |
|
"fmt" |
|
"net" |
|
"strings" |
|
"sync" |
|
"time" |
|
|
|
"github.com/mholt/acmez" |
|
"github.com/mholt/acmez/acme" |
|
"go.uber.org/zap" |
|
) |
|
|
|
// GetCertificate gets a certificate to satisfy clientHello. In getting |
|
// the certificate, it abides the rules and settings defined in the |
|
// Config that matches clientHello.ServerName. It first checks the in- |
|
// memory cache, then, if the config enables "OnDemand", it accesses |
|
// disk, then accesses the network if it must obtain a new certificate |
|
// via ACME. |
|
// |
|
// This method is safe for use as a tls.Config.GetCertificate callback. |
|
func (cfg *Config) GetCertificate(clientHello *tls.ClientHelloInfo) (*tls.Certificate, error) { |
|
cfg.emit("tls_handshake_started", clientHello) |
|
|
|
// special case: serve up the certificate for a TLS-ALPN ACME challenge |
|
// (https://tools.ietf.org/html/draft-ietf-acme-tls-alpn-05) |
|
for _, proto := range clientHello.SupportedProtos { |
|
if proto == acmez.ACMETLS1Protocol { |
|
cfg.certCache.mu.RLock() |
|
challengeCert, ok := cfg.certCache.cache[tlsALPNCertKeyName(clientHello.ServerName)] |
|
cfg.certCache.mu.RUnlock() |
|
if !ok { |
|
// see if this challenge was started in a cluster; try distributed challenge solver |
|
// (note that the tls.Config's ALPN settings must include the ACME TLS-ALPN challenge |
|
// protocol string, otherwise a valid certificate will not solve the challenge; we |
|
// should already have taken care of that when we made the tls.Config) |
|
challengeCert, ok, err := cfg.tryDistributedChallengeSolver(clientHello) |
|
if err != nil { |
|
if cfg.Logger != nil { |
|
cfg.Logger.Error("tls-alpn challenge", |
|
zap.String("server_name", clientHello.ServerName), |
|
zap.Error(err)) |
|
} |
|
} |
|
if ok { |
|
if cfg.Logger != nil { |
|
cfg.Logger.Info("served key authentication certificate", |
|
zap.String("server_name", clientHello.ServerName), |
|
zap.String("challenge", "tls-alpn-01"), |
|
zap.String("remote", clientHello.Conn.RemoteAddr().String()), |
|
zap.Bool("distributed", true)) |
|
} |
|
return &challengeCert.Certificate, nil |
|
} |
|
return nil, fmt.Errorf("no certificate to complete TLS-ALPN challenge for SNI name: %s", clientHello.ServerName) |
|
} |
|
if cfg.Logger != nil { |
|
cfg.Logger.Info("served key authentication certificate", |
|
zap.String("server_name", clientHello.ServerName), |
|
zap.String("challenge", "tls-alpn-01"), |
|
zap.String("remote", clientHello.Conn.RemoteAddr().String())) |
|
} |
|
return &challengeCert.Certificate, nil |
|
} |
|
} |
|
|
|
// get the certificate and serve it up |
|
cert, err := cfg.getCertDuringHandshake(clientHello, true, true) |
|
if err == nil { |
|
cfg.emit("tls_handshake_completed", clientHello) |
|
} |
|
return &cert.Certificate, err |
|
} |
|
|
|
// getCertificate gets a certificate that matches name from the in-memory |
|
// cache, according to the lookup table associated with cfg. The lookup then |
|
// points to a certificate in the Instance certificate cache. |
|
// |
|
// The name is expected to already be normalized (e.g. lowercased). |
|
// |
|
// If there is no exact match for name, it will be checked against names of |
|
// the form '*.example.com' (wildcard certificates) according to RFC 6125. |
|
// If a match is found, matched will be true. If no matches are found, matched |
|
// will be false and a "default" certificate will be returned with defaulted |
|
// set to true. If defaulted is false, then no certificates were available. |
|
// |
|
// The logic in this function is adapted from the Go standard library, |
|
// which is by the Go Authors. |
|
// |
|
// This function is safe for concurrent use. |
|
func (cfg *Config) getCertificate(hello *tls.ClientHelloInfo) (cert Certificate, matched, defaulted bool) { |
|
name := NormalizedName(hello.ServerName) |
|
|
|
if name == "" { |
|
// if SNI is empty, prefer matching IP address |
|
if hello.Conn != nil { |
|
addr := hello.Conn.LocalAddr().String() |
|
ip, _, err := net.SplitHostPort(addr) |
|
if err == nil { |
|
addr = ip |
|
} |
|
cert, matched = cfg.selectCert(hello, addr) |
|
if matched { |
|
return |
|
} |
|
} |
|
|
|
// fall back to a "default" certificate, if specified |
|
if cfg.DefaultServerName != "" { |
|
normDefault := NormalizedName(cfg.DefaultServerName) |
|
cert, defaulted = cfg.selectCert(hello, normDefault) |
|
if defaulted { |
|
return |
|
} |
|
} |
|
} else { |
|
// if SNI is specified, try an exact match first |
|
cert, matched = cfg.selectCert(hello, name) |
|
if matched { |
|
return |
|
} |
|
|
|
// try replacing labels in the name with |
|
// wildcards until we get a match |
|
labels := strings.Split(name, ".") |
|
for i := range labels { |
|
labels[i] = "*" |
|
candidate := strings.Join(labels, ".") |
|
cert, matched = cfg.selectCert(hello, candidate) |
|
if matched { |
|
return |
|
} |
|
} |
|
|
|
// check the certCache directly to see if the SNI name is |
|
// already the key of the certificate it wants; this implies |
|
// that the SNI can contain the hash of a specific cert |
|
// (chain) it wants and we will still be able to serve it up |
|
// (this behavior, by the way, could be controversial as to |
|
// whether it complies with RFC 6066 about SNI, but I think |
|
// it does, soooo...) |
|
// (this is how we solved the former ACME TLS-SNI challenge) |
|
cfg.certCache.mu.RLock() |
|
directCert, ok := cfg.certCache.cache[name] |
|
cfg.certCache.mu.RUnlock() |
|
if ok { |
|
cert = directCert |
|
matched = true |
|
return |
|
} |
|
} |
|
|
|
// otherwise, we're bingo on ammo; see issues |
|
// caddyserver/caddy#2035 and caddyserver/caddy#1303 (any |
|
// change to certificate matching behavior must |
|
// account for hosts defined where the hostname |
|
// is empty or a catch-all, like ":443" or |
|
// "0.0.0.0:443") |
|
|
|
return |
|
} |
|
|
|
// selectCert uses hello to select a certificate from the |
|
// cache for name. If cfg.CertSelection is set, it will be |
|
// used to make the decision. Otherwise, the first matching |
|
// unexpired cert is returned. As a special case, if no |
|
// certificates match name and cfg.CertSelection is set, |
|
// then all certificates in the cache will be passed in |
|
// for the cfg.CertSelection to make the final decision. |
|
func (cfg *Config) selectCert(hello *tls.ClientHelloInfo, name string) (Certificate, bool) { |
|
choices := cfg.certCache.getAllMatchingCerts(name) |
|
if len(choices) == 0 { |
|
if cfg.CertSelection == nil { |
|
return Certificate{}, false |
|
} |
|
choices = cfg.certCache.getAllCerts() |
|
} |
|
if cfg.CertSelection == nil { |
|
cert, err := DefaultCertificateSelector(hello, choices) |
|
return cert, err == nil |
|
} |
|
cert, err := cfg.CertSelection.SelectCertificate(hello, choices) |
|
return cert, err == nil |
|
} |
|
|
|
// DefaultCertificateSelector is the default certificate selection logic |
|
// given a choice of certificates. If there is at least one certificate in |
|
// choices, it always returns a certificate without error. It chooses the |
|
// first non-expired certificate that the client supports if possible, |
|
// otherwise it returns an expired certificate that the client supports, |
|
// otherwise it just returns the first certificate in the list of choices. |
|
func DefaultCertificateSelector(hello *tls.ClientHelloInfo, choices []Certificate) (Certificate, error) { |
|
if len(choices) == 0 { |
|
return Certificate{}, fmt.Errorf("no certificates available") |
|
} |
|
now := time.Now() |
|
best := choices[0] |
|
for _, choice := range choices { |
|
if err := hello.SupportsCertificate(&choice.Certificate); err != nil { |
|
continue |
|
} |
|
best = choice // at least the client supports it... |
|
if now.After(choice.Leaf.NotBefore) && now.Before(choice.Leaf.NotAfter) { |
|
return choice, nil // ...and unexpired, great! "Certificate, I choose you!" |
|
} |
|
} |
|
return best, nil // all matching certs are expired or incompatible, oh well |
|
} |
|
|
|
// getCertDuringHandshake will get a certificate for hello. It first tries |
|
// the in-memory cache. If no certificate for hello is in the cache, the |
|
// config most closely corresponding to hello will be loaded. If that config |
|
// allows it (OnDemand==true) and if loadIfNecessary == true, it goes to disk |
|
// to load it into the cache and serve it. If it's not on disk and if |
|
// obtainIfNecessary == true, the certificate will be obtained from the CA, |
|
// cached, and served. If obtainIfNecessary is true, then loadIfNecessary |
|
// must also be set to true. An error will be returned if and only if no |
|
// certificate is available. |
|
// |
|
// This function is safe for concurrent use. |
|
func (cfg *Config) getCertDuringHandshake(hello *tls.ClientHelloInfo, loadIfNecessary, obtainIfNecessary bool) (Certificate, error) { |
|
log := loggerNamed(cfg.Logger, "on_demand") |
|
|
|
// First check our in-memory cache to see if we've already loaded it |
|
cert, matched, defaulted := cfg.getCertificate(hello) |
|
if matched { |
|
if cert.managed && cfg.OnDemand != nil && obtainIfNecessary { |
|
// It's been reported before that if the machine goes to sleep (or |
|
// suspends the process) that certs which are already loaded into |
|
// memory won't get renewed in the background, so we need to check |
|
// expiry on each handshake too, sigh: |
|
// https://caddy.community/t/local-certificates-not-renewing-on-demand/9482 |
|
return cfg.optionalMaintenance(log, cert, hello) |
|
} |
|
return cert, nil |
|
} |
|
|
|
name := cfg.getNameFromClientHello(hello) |
|
|
|
// If OnDemand is enabled, then we might be able to load or |
|
// obtain a needed certificate |
|
if cfg.OnDemand != nil && loadIfNecessary { |
|
// Then check to see if we have one on disk |
|
loadedCert, err := cfg.CacheManagedCertificate(name) |
|
if err == nil { |
|
loadedCert, err = cfg.handshakeMaintenance(hello, loadedCert) |
|
if err != nil { |
|
if log != nil { |
|
log.Error("maintining newly-loaded certificate", |
|
zap.String("server_name", name), |
|
zap.Error(err)) |
|
} |
|
} |
|
return loadedCert, nil |
|
} |
|
if obtainIfNecessary { |
|
// By this point, we need to ask the CA for a certificate |
|
|
|
// Make sure the certificate should be obtained based on config |
|
err := cfg.checkIfCertShouldBeObtained(name) |
|
if err != nil { |
|
return Certificate{}, err |
|
} |
|
|
|
// Obtain certificate from the CA |
|
return cfg.obtainOnDemandCertificate(hello) |
|
} |
|
} |
|
|
|
// Fall back to the default certificate if there is one |
|
if defaulted { |
|
return cert, nil |
|
} |
|
|
|
return Certificate{}, fmt.Errorf("no certificate available for '%s'", name) |
|
} |
|
|
|
// optionalMaintenance will perform maintenance on the certificate (if necessary) and |
|
// will return the resulting certificate. This should only be done if the certificate |
|
// is managed, OnDemand is enabled, and the scope is allowed to obtain certificates. |
|
func (cfg *Config) optionalMaintenance(log *zap.Logger, cert Certificate, hello *tls.ClientHelloInfo) (Certificate, error) { |
|
newCert, err := cfg.handshakeMaintenance(hello, cert) |
|
if err == nil { |
|
return newCert, nil |
|
} |
|
|
|
if log != nil { |
|
log.Error("renewing certificate on-demand failed", |
|
zap.Strings("subjects", cert.Names), |
|
zap.Time("not_after", cert.Leaf.NotAfter), |
|
zap.Error(err)) |
|
} |
|
|
|
if cert.Expired() { |
|
return cert, err |
|
} |
|
|
|
// still has time remaining, so serve it anyway |
|
return cert, nil |
|
} |
|
|
|
// checkIfCertShouldBeObtained checks to see if an on-demand TLS certificate |
|
// should be obtained for a given domain based upon the config settings. If |
|
// a non-nil error is returned, do not issue a new certificate for name. |
|
func (cfg *Config) checkIfCertShouldBeObtained(name string) error { |
|
if cfg.OnDemand == nil { |
|
return fmt.Errorf("not configured for on-demand certificate issuance") |
|
} |
|
if !SubjectQualifiesForCert(name) { |
|
return fmt.Errorf("subject name does not qualify for certificate: %s", name) |
|
} |
|
if cfg.OnDemand.DecisionFunc != nil { |
|
return cfg.OnDemand.DecisionFunc(name) |
|
} |
|
if len(cfg.OnDemand.hostWhitelist) > 0 && |
|
!cfg.OnDemand.whitelistContains(name) { |
|
return fmt.Errorf("certificate for '%s' is not managed", name) |
|
} |
|
return nil |
|
} |
|
|
|
// obtainOnDemandCertificate obtains a certificate for hello. |
|
// If another goroutine has already started obtaining a cert for |
|
// hello, it will wait and use what the other goroutine obtained. |
|
// |
|
// This function is safe for use by multiple concurrent goroutines. |
|
func (cfg *Config) obtainOnDemandCertificate(hello *tls.ClientHelloInfo) (Certificate, error) { |
|
log := loggerNamed(cfg.Logger, "on_demand") |
|
|
|
name := cfg.getNameFromClientHello(hello) |
|
|
|
// We must protect this process from happening concurrently, so synchronize. |
|
obtainCertWaitChansMu.Lock() |
|
wait, ok := obtainCertWaitChans[name] |
|
if ok { |
|
// lucky us -- another goroutine is already obtaining the certificate. |
|
// wait for it to finish obtaining the cert and then we'll use it. |
|
obtainCertWaitChansMu.Unlock() |
|
<-wait |
|
return cfg.getCertDuringHandshake(hello, true, false) |
|
} |
|
|
|
// looks like it's up to us to do all the work and obtain the cert. |
|
// make a chan others can wait on if needed |
|
wait = make(chan struct{}) |
|
obtainCertWaitChans[name] = wait |
|
obtainCertWaitChansMu.Unlock() |
|
|
|
// obtain the certificate |
|
if log != nil { |
|
log.Info("obtaining new certificate", zap.String("server_name", name)) |
|
} |
|
// TODO: use a proper context; we use one with timeout because retries are enabled because interactive is false |
|
ctx, cancel := context.WithTimeout(context.TODO(), 90*time.Second) |
|
defer cancel() |
|
err := cfg.ObtainCert(ctx, name, false) |
|
|
|
// immediately unblock anyone waiting for it; doing this in |
|
// a defer would risk deadlock because of the recursive call |
|
// to getCertDuringHandshake below when we return! |
|
obtainCertWaitChansMu.Lock() |
|
close(wait) |
|
delete(obtainCertWaitChans, name) |
|
obtainCertWaitChansMu.Unlock() |
|
|
|
if err != nil { |
|
// shucks; failed to solve challenge on-demand |
|
return Certificate{}, err |
|
} |
|
|
|
// success; certificate was just placed on disk, so |
|
// we need only restart serving the certificate |
|
return cfg.getCertDuringHandshake(hello, true, false) |
|
} |
|
|
|
// handshakeMaintenance performs a check on cert for expiration and OCSP validity. |
|
// If necessary, it will renew the certificate and/or refresh the OCSP staple. |
|
// OCSP stapling errors are not returned, only logged. |
|
// |
|
// This function is safe for use by multiple concurrent goroutines. |
|
func (cfg *Config) handshakeMaintenance(hello *tls.ClientHelloInfo, cert Certificate) (Certificate, error) { |
|
log := loggerNamed(cfg.Logger, "on_demand") |
|
|
|
// Check cert expiration |
|
timeLeft := cert.Leaf.NotAfter.Sub(time.Now().UTC()) |
|
if currentlyInRenewalWindow(cert.Leaf.NotBefore, cert.Leaf.NotAfter, cfg.RenewalWindowRatio) { |
|
if log != nil { |
|
log.Info("certificate expires soon; attempting renewal", |
|
zap.Strings("identifiers", cert.Names), |
|
zap.Duration("remaining", timeLeft)) |
|
} |
|
return cfg.renewDynamicCertificate(hello, cert) |
|
} |
|
|
|
// Check OCSP staple validity |
|
if cert.ocsp != nil { |
|
refreshTime := cert.ocsp.ThisUpdate.Add(cert.ocsp.NextUpdate.Sub(cert.ocsp.ThisUpdate) / 2) |
|
if time.Now().After(refreshTime) { |
|
_, err := stapleOCSP(cfg.Storage, &cert, nil) |
|
if err != nil { |
|
// An error with OCSP stapling is not the end of the world, and in fact, is |
|
// quite common considering not all certs have issuer URLs that support it. |
|
if log != nil { |
|
log.Warn("stapling OCSP", |
|
zap.String("server_name", hello.ServerName), |
|
zap.Error(err)) |
|
} |
|
} |
|
cfg.certCache.mu.Lock() |
|
cfg.certCache.cache[cert.hash] = cert |
|
cfg.certCache.mu.Unlock() |
|
} |
|
} |
|
|
|
return cert, nil |
|
} |
|
|
|
// renewDynamicCertificate renews the certificate for name using cfg. It returns the |
|
// certificate to use and an error, if any. name should already be lower-cased before |
|
// calling this function. name is the name obtained directly from the handshake's |
|
// ClientHello. |
|
// |
|
// This function is safe for use by multiple concurrent goroutines. |
|
func (cfg *Config) renewDynamicCertificate(hello *tls.ClientHelloInfo, currentCert Certificate) (Certificate, error) { |
|
log := loggerNamed(cfg.Logger, "on_demand") |
|
|
|
name := cfg.getNameFromClientHello(hello) |
|
|
|
obtainCertWaitChansMu.Lock() |
|
wait, ok := obtainCertWaitChans[name] |
|
if ok { |
|
// lucky us -- another goroutine is already renewing the certificate. |
|
// wait for it to finish, then we'll use the new one. |
|
obtainCertWaitChansMu.Unlock() |
|
<-wait |
|
return cfg.getCertDuringHandshake(hello, true, false) |
|
} |
|
|
|
// looks like it's up to us to do all the work and renew the cert |
|
wait = make(chan struct{}) |
|
obtainCertWaitChans[name] = wait |
|
obtainCertWaitChansMu.Unlock() |
|
|
|
// Make sure a certificate for this name should be obtained on-demand |
|
err := cfg.checkIfCertShouldBeObtained(name) |
|
if err != nil { |
|
// if not, remove from cache (it will be deleted from storage later) |
|
cfg.certCache.mu.Lock() |
|
cfg.certCache.removeCertificate(currentCert) |
|
cfg.certCache.mu.Unlock() |
|
return Certificate{}, err |
|
} |
|
|
|
// renew and reload the certificate |
|
if log != nil { |
|
log.Info("renewing certificate", zap.String("server_name", name)) |
|
} |
|
// TODO: use a proper context; we use one with timeout because retries are enabled because interactive is false |
|
ctx, cancel := context.WithTimeout(context.TODO(), 90*time.Second) |
|
defer cancel() |
|
err = cfg.RenewCert(ctx, name, false) |
|
if err == nil { |
|
// even though the recursive nature of the dynamic cert loading |
|
// would just call this function anyway, we do it here to |
|
// make the replacement as atomic as possible. |
|
newCert, err := cfg.CacheManagedCertificate(name) |
|
if err != nil { |
|
if log != nil { |
|
log.Error("loading renewed certificate", zap.String("server_name", name), zap.Error(err)) |
|
} |
|
} else { |
|
// replace the old certificate with the new one |
|
cfg.certCache.replaceCertificate(currentCert, newCert) |
|
} |
|
} |
|
|
|
// immediately unblock anyone waiting for it; doing this in |
|
// a defer would risk deadlock because of the recursive call |
|
// to getCertDuringHandshake below when we return! |
|
obtainCertWaitChansMu.Lock() |
|
close(wait) |
|
delete(obtainCertWaitChans, name) |
|
obtainCertWaitChansMu.Unlock() |
|
|
|
if err != nil { |
|
return Certificate{}, err |
|
} |
|
|
|
return cfg.getCertDuringHandshake(hello, true, false) |
|
} |
|
|
|
// tryDistributedChallengeSolver is to be called when the clientHello pertains to |
|
// a TLS-ALPN challenge and a certificate is required to solve it. This method |
|
// checks the distributed store of challenge info files and, if a matching ServerName |
|
// is present, it makes a certificate to solve this challenge and returns it. For |
|
// this to succeed, it requires that cfg.Issuer is of type *ACMEManager. |
|
// A boolean true is returned if a valid certificate is returned. |
|
func (cfg *Config) tryDistributedChallengeSolver(clientHello *tls.ClientHelloInfo) (Certificate, bool, error) { |
|
am, ok := cfg.Issuer.(*ACMEManager) |
|
if !ok { |
|
return Certificate{}, false, nil |
|
} |
|
tokenKey := distributedSolver{acmeManager: am, caURL: am.CA}.challengeTokensKey(clientHello.ServerName) |
|
chalInfoBytes, err := cfg.Storage.Load(tokenKey) |
|
if err != nil { |
|
if _, ok := err.(ErrNotExist); ok { |
|
return Certificate{}, false, nil |
|
} |
|
return Certificate{}, false, fmt.Errorf("opening distributed challenge token file %s: %v", tokenKey, err) |
|
} |
|
|
|
var chalInfo acme.Challenge |
|
err = json.Unmarshal(chalInfoBytes, &chalInfo) |
|
if err != nil { |
|
return Certificate{}, false, fmt.Errorf("decoding challenge token file %s (corrupted?): %v", tokenKey, err) |
|
} |
|
|
|
cert, err := acmez.TLSALPN01ChallengeCert(chalInfo) |
|
if err != nil { |
|
return Certificate{}, false, fmt.Errorf("making TLS-ALPN challenge certificate: %v", err) |
|
} |
|
if cert == nil { |
|
return Certificate{}, false, fmt.Errorf("got nil TLS-ALPN challenge certificate but no error") |
|
} |
|
|
|
return Certificate{Certificate: *cert}, true, nil |
|
} |
|
|
|
// getNameFromClientHello returns a normalized form of hello.ServerName. |
|
// If hello.ServerName is empty (i.e. client did not use SNI), then the |
|
// associated connection's local address is used to extract an IP address. |
|
func (*Config) getNameFromClientHello(hello *tls.ClientHelloInfo) string { |
|
name := NormalizedName(hello.ServerName) |
|
if name != "" || hello.Conn == nil { |
|
return name |
|
} |
|
|
|
// if no SNI, try using IP address on the connection |
|
localAddr := hello.Conn.LocalAddr().String() |
|
localAddrHost, _, err := net.SplitHostPort(localAddr) |
|
if err == nil { |
|
return localAddrHost |
|
} |
|
return localAddr |
|
} |
|
|
|
// NormalizedName returns serverName with surrounding whitespace removed
// and all letters lower-cased, so that SNI values can be compared and
// used as keys consistently.
func NormalizedName(serverName string) string {
	trimmed := strings.TrimSpace(serverName)
	return strings.ToLower(trimmed)
}
|
|
|
var (
	// obtainCertWaitChans is used to coordinate obtaining certs for each
	// hostname: while a name has an entry, an obtain or renewal for it is
	// in progress, and the channel is closed when that work finishes.
	obtainCertWaitChans = map[string]chan struct{}{}

	// obtainCertWaitChansMu guards obtainCertWaitChans.
	obtainCertWaitChansMu sync.Mutex
)
|
|
|