cert-manager-webhook-sthome/pkg/util/wait.go

580 lines
17 KiB
Go

// +skip_license_check
/*
This file contains portions of code directly taken from the 'xenolf/lego' project.
A copy of the license for this code can be found in the file named LICENSE in
this directory.
*/
package util
import (
"bytes"
"context"
"fmt"
"io"
"net"
"net/http"
"strings"
"sync"
"time"
"github.com/miekg/dns"
klog "k8s.io/klog/v2"
//logf "github.com/cert-manager/cert-manager/pkg/logs"
)
type preCheckDNSFunc func(fqdn, value string, nameservers []string,
useAuthoritative bool) (bool, error)
type dnsQueryFunc func(fqdn string, rtype uint16, nameservers []string, recursive bool) (in *dns.Msg, err error)
var (
// PreCheckDNS checks DNS propagation before notifying ACME that
// the DNS challenge is ready.
PreCheckDNS preCheckDNSFunc = checkDNSPropagation
// dnsQuery is used to be able to mock DNSQuery
dnsQuery dnsQueryFunc = DNSQuery
fqdnToZoneLock sync.RWMutex
fqdnToZone = map[string]string{}
)
const defaultResolvConf = "/etc/resolv.conf"
const issueTag = "issue"
const issuewildTag = "issuewild"
var defaultNameservers = []string{
"8.8.8.8:53",
"8.8.4.4:53",
}
var RecursiveNameservers = getNameservers(defaultResolvConf, defaultNameservers)
// DNSTimeout is used to override the default DNS timeout of 10 seconds.
var DNSTimeout = 10 * time.Second
// getNameservers attempts to get systems nameservers before falling back to the defaults
func getNameservers(path string, defaults []string) []string {
config, err := dns.ClientConfigFromFile(path)
if err != nil || len(config.Servers) == 0 {
return defaults
}
systemNameservers := []string{}
for _, server := range config.Servers {
// ensure all servers have a port number
if _, _, err := net.SplitHostPort(server); err != nil {
systemNameservers = append(systemNameservers, net.JoinHostPort(server, "53"))
} else {
systemNameservers = append(systemNameservers, server)
}
}
return systemNameservers
}
// Follows the CNAME records and returns the last non-CNAME fully qualified domain name
// that it finds. Returns an error when a loop is found in the CNAME chain. The
// argument fqdnChain is used by the function itself to keep track of which fqdns it
// already encountered and detect loops.
func followCNAMEs(fqdn string, nameservers []string, fqdnChain ...string) (string, error) {
r, err := dnsQuery(fqdn, dns.TypeCNAME, nameservers, true)
if err != nil {
return "", err
}
if r.Rcode != dns.RcodeSuccess {
return fqdn, err
}
for _, rr := range r.Answer {
cn, ok := rr.(*dns.CNAME)
if !ok || cn.Hdr.Name != fqdn {
continue
}
klog.Infof("Updating FQDN: %s with its CNAME: %s", fqdn, cn.Target)
// Check if we were here before to prevent loops in the chain of CNAME records.
for _, fqdnInChain := range fqdnChain {
if cn.Target != fqdnInChain {
continue
}
return "", fmt.Errorf("found recursive CNAME record to %q when looking up %q", cn.Target, fqdn)
}
return followCNAMEs(cn.Target, nameservers, append(fqdnChain, fqdn)...)
}
return fqdn, nil
}
// checkDNSPropagation checks if the expected TXT record has been propagated to all authoritative nameservers.
func checkDNSPropagation(fqdn, value string, nameservers []string,
useAuthoritative bool) (bool, error) {
var err error
fqdn, err = followCNAMEs(fqdn, nameservers)
//klog.Infof("PreCheckDNS: followCNAMEs returned fqdn: %s, err: %s", fqdn, err)
if err != nil {
return false, err
}
if !useAuthoritative {
var success bool
success, err = checkAuthoritativeNss(fqdn, value, nameservers)
//klog.Infof("PreCheckDNS: returned success: %t, err: %s", success, err)
return success, err
}
authoritativeNss, err := lookupNameservers(fqdn, nameservers)
//klog.Infof("PreCheckDNS: lookupNameservers returned authoritativeNss: %s, err: %s", authoritativeNss, err)
if err != nil {
return false, err
}
for i, ans := range authoritativeNss {
authoritativeNss[i] = net.JoinHostPort(ans, "53")
}
return checkAuthoritativeNss(fqdn, value, authoritativeNss)
}
// checkAuthoritativeNss queries each of the given nameservers for the expected TXT record.
func checkAuthoritativeNss(fqdn, value string, nameservers []string) (bool, error) {
for _, ns := range nameservers {
klog.Infof("================== NS: %s ==================", ns)
r, err := DNSQuery(fqdn, dns.TypeTXT, []string{ns}, true)
//klog.Infof("DNSQuery returned \nr: %s, \nerr: %s", r, err)
if err != nil {
klog.Infof("DNSQuery failed, err: %s", err)
return false, err
}
klog.Infof("DNSQuery succeeded with r.Rcode: %d", r.Rcode)
// NXDomain response is not really an error, just waiting for propagation to happen
if !(r.Rcode == dns.RcodeSuccess || r.Rcode == dns.RcodeNameError) {
//klog.Errorf("NS %s returned %s for %s", ns, dns.RcodeToString[r.Rcode], fqdn)
return false, fmt.Errorf("NS %s returned %s for %s", ns, dns.RcodeToString[r.Rcode], fqdn)
}
klog.Infof("%q: must be %s", fqdn, value)
//klog.Infof("r.Answer: %s", r.Answer)
var found bool
var i = 0
for _, rr := range r.Answer {
i++
//txt1, ok1 := rr.(*dns.TXT)
//klog.Infof("Compare[%d]: ok: %t, query: %s, value: %s", i, ok1, strings.Join(txt1.Txt, ""), value)
if txt, ok := rr.(*dns.TXT); ok {
klog.Infof("Compare[%d]: Q: %s, A: %s", i, value, strings.Join(txt.Txt, ""))
if strings.Join(txt.Txt, "") == value {
found = true
break
}
}
}
if !found {
return false, nil
}
}
klog.Infof("Selfchecking using the DNS Lookup method was successful")
return true, nil
}
// DNSQuery will query a nameserver, iterating through the supplied servers as it retries
// The nameserver should include a port, to facilitate testing where we talk to a mock dns server.
func DNSQuery(fqdn string, rtype uint16, nameservers []string, recursive bool) (in *dns.Msg, err error) {
switch rtype {
case dns.TypeCAA, dns.TypeCNAME, dns.TypeNS, dns.TypeSOA, dns.TypeTXT:
default:
// We explicitly specified here what types are supported, so we can more confidently create tests for this function.
return nil, fmt.Errorf("unsupported DNS record type %d", rtype)
}
m := new(dns.Msg)
m.SetQuestion(fqdn, rtype)
m.SetEdns0(4096, false)
if !recursive {
m.RecursionDesired = false
}
udp := &dns.Client{Net: "udp", Timeout: DNSTimeout}
tcp := &dns.Client{Net: "tcp", Timeout: DNSTimeout}
httpClient := *http.DefaultClient
httpClient.Timeout = DNSTimeout
http := httpDNSClient{
HTTPClient: &httpClient,
}
// Will retry the request based on the number of servers (n+1)
for _, ns := range nameservers {
// If the TCP request succeeds, the err will reset to nil
if strings.HasPrefix(ns, "https://") {
in, _, err = http.Exchange(context.TODO(), m, ns)
} else {
in, _, err = udp.Exchange(m, ns)
// Try TCP if UDP fails
if (in != nil && in.Truncated) ||
(err != nil && strings.HasPrefix(err.Error(), "read udp") && strings.HasSuffix(err.Error(), "i/o timeout")) {
klog.Infof("UDP dns lookup failed, retrying with TCP: %v", err)
// If the TCP request succeeds, the err will reset to nil
in, _, err = tcp.Exchange(m, ns)
}
}
if err == nil {
break
}
}
return
}
type httpDNSClient struct {
HTTPClient *http.Client
}
const dohMimeType = "application/dns-message"
func (c *httpDNSClient) Exchange(ctx context.Context, m *dns.Msg, a string) (r *dns.Msg, rtt time.Duration, err error) {
p, err := m.Pack()
if err != nil {
return nil, 0, err
}
req, err := http.NewRequest(http.MethodPost, a, bytes.NewReader(p))
if err != nil {
return nil, 0, err
}
req.Header.Set("Content-Type", dohMimeType)
req.Header.Set("Accept", dohMimeType)
hc := http.DefaultClient
if c.HTTPClient != nil {
hc = c.HTTPClient
}
req = req.WithContext(ctx)
t := time.Now()
resp, err := hc.Do(req)
if err != nil {
return nil, 0, err
}
defer resp.Body.Close()
if resp.StatusCode != http.StatusOK {
return nil, 0, fmt.Errorf("dns: server returned HTTP %d error: %q", resp.StatusCode, resp.Status)
}
if ct := resp.Header.Get("Content-Type"); ct != dohMimeType {
return nil, 0, fmt.Errorf("dns: unexpected Content-Type %q; expected %q", ct, dohMimeType)
}
p, err = io.ReadAll(resp.Body)
if err != nil {
return nil, 0, err
}
rtt = time.Since(t)
r = new(dns.Msg)
if err := r.Unpack(p); err != nil {
return r, 0, err
}
return r, rtt, nil
}
func ValidateCAA(domain string, issuerID []string, iswildcard bool, nameservers []string) error {
// see https://tools.ietf.org/html/rfc6844#section-4
// for more information about how CAA lookup is performed
fqdn := ToFqdn(domain)
issuerSet := make(map[string]bool)
for _, s := range issuerID {
issuerSet[s] = true
}
var caas []*dns.CAA
for {
// follow at most 8 cnames per label
queryDomain := fqdn
var msg *dns.Msg
var err error
for i := 0; i < 8; i++ {
// usually, we should be able to just ask the local recursive
// nameserver for CAA records, but some setups will return SERVFAIL
// on unknown types like CAA. Instead, ask the authoritative server
var authNS []string
authNS, err = lookupNameservers(queryDomain, nameservers)
if err != nil {
return fmt.Errorf("could not validate CAA record: %s", err)
}
for i, ans := range authNS {
authNS[i] = net.JoinHostPort(ans, "53")
}
msg, err = DNSQuery(queryDomain, dns.TypeCAA, authNS, false)
if err != nil {
return fmt.Errorf("could not validate CAA record: %s", err)
}
// domain may not exist, which is fine. It will fail HTTP01 checks
// but DNS01 checks will create a proper domain
if msg.Rcode == dns.RcodeNameError {
break
}
if msg.Rcode != dns.RcodeSuccess {
return fmt.Errorf("could not validate CAA: Unexpected response code '%s' for %s",
dns.RcodeToString[msg.Rcode], domain)
}
oldQuery := queryDomain
queryDomain, err := followCNAMEs(queryDomain, nameservers)
if err != nil {
return fmt.Errorf("while trying to follow CNAMEs for domain %s using nameservers %v: %w", queryDomain, nameservers, err)
}
if queryDomain == oldQuery {
break
}
}
// we have a response that's not a CNAME. It might be empty.
// if it is, go up a label and ask again
for _, rr := range msg.Answer {
caa, ok := rr.(*dns.CAA)
if !ok {
continue
}
caas = append(caas, caa)
}
// once we've found any CAA records, we use these CAAs
if len(caas) != 0 {
break
}
index := strings.Index(fqdn, ".")
if index == -1 {
panic("should never happen")
}
fqdn = fqdn[index+1:]
if len(fqdn) == 0 {
// we reached the root with no CAA, don't bother asking
return nil
}
}
if !matchCAA(caas, issuerSet, iswildcard) {
// TODO(dmo): better error message
return fmt.Errorf("CAA record does not match issuer")
}
return nil
}
func matchCAA(caas []*dns.CAA, issuerIDs map[string]bool, iswildcard bool) bool {
matches := false
for _, caa := range caas {
// if we require a wildcard certificate, we must prioritize any issuewild
// tags - only if it matches (regardless of any other entries) can we
// issue a wildcard certificate
if iswildcard && caa.Tag == issuewildTag {
return issuerIDs[caa.Value]
}
// issue tags allow any certificate, we perform a check which will only
// be returned if we do not need a wildcard certificate, or if we need
// a wildcard certificate and no issuewild entries are present
if caa.Tag == issueTag {
matches = matches || issuerIDs[caa.Value]
}
}
return matches
}
// lookupNameservers returns the authoritative nameservers for the given fqdn.
func lookupNameservers(fqdn string, nameservers []string) ([]string, error) {
var authoritativeNss []string
//klog.Infof("Searching fqdn %q using seed nameservers [%s]", fqdn, strings.Join(nameservers, ", "))
klog.Infof("Searching fqdn %q", fqdn)
zone, err := FindZoneByFqdn(fqdn, nameservers)
if err != nil {
return nil, fmt.Errorf("could not determine the zone for %q: %v", fqdn, err)
}
r, err := DNSQuery(zone, dns.TypeNS, nameservers, true)
if err != nil {
return nil, err
}
for _, rr := range r.Answer {
if ns, ok := rr.(*dns.NS); ok {
authoritativeNss = append(authoritativeNss, strings.ToLower(ns.Ns))
}
}
if len(authoritativeNss) > 0 {
//klog.Infof("Returning authoritative nameservers [%s]", strings.Join(authoritativeNss, ", "))
return authoritativeNss, nil
}
return nil, fmt.Errorf("could not determine authoritative nameservers for %q", fqdn)
}
// FindZoneByFqdn determines the zone apex for the given fqdn by recursing up the
// domain labels until the nameserver returns a SOA record in the answer section.
func FindZoneByFqdn(fqdn string, nameservers []string) (string, error) {
fqdnToZoneLock.RLock()
// Do we have it cached?
if zone, ok := fqdnToZone[fqdn]; ok {
fqdnToZoneLock.RUnlock()
klog.Infof("Return zone %q for %q", zone, fqdn)
return zone, nil
}
fqdnToZoneLock.RUnlock()
labelIndexes := dns.Split(fqdn)
// We are climbing up the domain tree, looking for the SOA record on
// one of them. For example, imagine that the DNS tree looks like this:
//
// example.com. ← SOA is here.
// └── foo.example.com.
// └── _acme-challenge.foo.example.com. ← Starting point.
//
// We start at the bottom of the tree and climb up. The NXDOMAIN error
// lets us know that we should climb higher:
//
// _acme-challenge.foo.example.com. returns NXDOMAIN
// foo.example.com. returns NXDOMAIN
// example.com. returns NOERROR along with the SOA
for _, index := range labelIndexes {
domain := fqdn[index:]
in, err := DNSQuery(domain, dns.TypeSOA, nameservers, true)
if err != nil {
return "", err
}
// NXDOMAIN tells us that we did not climb far enough up the DNS tree. We
// thus continue climbing to find the SOA record.
if in.Rcode == dns.RcodeNameError {
continue
}
// Any non-successful response code, other than NXDOMAIN, is treated as an error
// and interrupts the search.
if in.Rcode != dns.RcodeSuccess {
return "", fmt.Errorf("when querying the SOA record for the domain '%s' using nameservers %v, rcode was expected to be 'NOERROR' or 'NXDOMAIN', but got '%s'",
domain, nameservers, dns.RcodeToString[in.Rcode])
}
// As per RFC 2181, CNAME records cannot not exist at the root of a zone,
// which means we won't be finding any SOA record for this domain.
if dnsMsgContainsCNAME(in) {
continue
}
for _, ans := range in.Answer {
if soa, ok := ans.(*dns.SOA); ok {
fqdnToZoneLock.Lock()
defer fqdnToZoneLock.Unlock()
zone := soa.Hdr.Name
fqdnToZone[fqdn] = zone
klog.Infof("Zone record %q for fqdn %q", zone, fqdn)
return zone, nil
}
}
}
return "", fmt.Errorf("could not find the SOA record in the DNS tree for the domain '%s' using nameservers %v", fqdn, nameservers)
}
// dnsMsgContainsCNAME checks for a CNAME answer in msg
func dnsMsgContainsCNAME(msg *dns.Msg) bool {
for _, ans := range msg.Answer {
if _, ok := ans.(*dns.CNAME); ok {
return true
}
}
return false
}
// ToFqdn converts the name into a fqdn appending a trailing dot.
func ToFqdn(name string) string {
n := len(name)
if n == 0 || name[n-1] == '.' {
return name
}
return name + "."
}
// UnFqdn converts the fqdn into a name removing the trailing dot.
func UnFqdn(name string) string {
n := len(name)
if n != 0 && name[n-1] == '.' {
return name[:n-1]
}
return name
}
// WaitFor polls the given function 'f', once every 'interval', up to 'timeout'.
func WaitFor(timeout, interval time.Duration, f func() (bool, error)) error {
var lastErr string
timeup := time.After(timeout)
for {
select {
case <-timeup:
return fmt.Errorf("time limit exceeded. Last error: %s", lastErr)
default:
}
stop, err := f()
if stop {
return nil
}
if err != nil {
lastErr = err.Error()
}
time.Sleep(interval)
}
}
// DNS01LookupFQDN returns a DNS name which will be updated to solve the dns-01
// challenge
// TODO: move this into the pkg/acme package
func DNS01LookupFQDN(domain string, followCNAME bool, nameservers ...string) (string, error) {
fqdn := fmt.Sprintf("_acme-challenge.%s.", domain)
// Check if the domain has CNAME then return that
if followCNAME {
var err error
fqdn, err = followCNAMEs(fqdn, nameservers)
if err != nil {
return "", err
}
}
return fqdn, nil
}
// FindBestMatch returns the longest match for a given domain within a list of domains
func FindBestMatch(query string, domains ...string) (string, error) {
var maxSoFar int
var longest string
for _, domain := range domains {
if query == domain {
// Found exact match
return domain, nil
}
maxHere := dns.CompareDomainName(query, domain)
if maxHere > maxSoFar && dns.IsSubDomain(domain, query) {
maxSoFar = maxHere
longest = domain
}
}
if len(longest) == 0 {
return "", fmt.Errorf("query: %v has no matches", query)
}
return longest, nil
}