2022-06-10 11:32:08 -05:00
package nomad
import (
"context"
2022-09-19 16:26:08 +02:00
"errors"
2022-06-10 11:32:08 -05:00
"fmt"
"strings"
"text/template"
"time"
"github.com/cenkalti/backoff/v4"
"github.com/hashicorp/nomad/api"
2022-11-21 18:36:05 +01:00
"github.com/rs/zerolog/log"
2022-06-10 11:32:08 -05:00
ptypes "github.com/traefik/paerser/types"
2023-02-03 15:24:05 +01:00
"github.com/traefik/traefik/v3/pkg/config/dynamic"
"github.com/traefik/traefik/v3/pkg/job"
"github.com/traefik/traefik/v3/pkg/logs"
"github.com/traefik/traefik/v3/pkg/provider"
"github.com/traefik/traefik/v3/pkg/provider/constraints"
"github.com/traefik/traefik/v3/pkg/safe"
"github.com/traefik/traefik/v3/pkg/types"
2022-06-10 11:32:08 -05:00
)
// Package-level defaults of the Nomad provider.
const (
// providerName is the base name of this provider; BuildProviders appends
// "-<namespace>" to it for namespaced instances.
providerName = "nomad"
// defaultTemplateRule is the routing rule template that SetDefaults assigns to
// Configuration.DefaultRule.
defaultTemplateRule = "Host(`{{ normalize .Name }}`)"
// defaultPrefix is the default prefix used in tag values indicating the service
// should be consumed and exposed via traefik.
defaultPrefix = "traefik"
)
// Compile-time check that *Provider satisfies the provider.Provider interface.
var _ provider . Provider = ( * Provider ) ( nil )
// item is the flattened description of one Nomad service entry handed to
// buildConfig. It is filled either from a registered service instance or, when
// empty services are allowed, from a job definition whose task group is scaled
// to zero (in which case Node, Datacenter and Address are empty and Port is -1).
type item struct {
ID string // service ID (synthesized from job/group/task/service names for placeholder entries)
Name string // service name
Namespace string // service namespace
Node string // node ID
Datacenter string // datacenter reported for the service instance
Address string // service address
Port int // service port
Tags [ ] string // service tags
ExtraConf configuration // provider-level options parsed from the tags by getExtraConf
}
2023-03-22 12:00:25 +01:00
// configuration contains information from the service's tags that are globals
// (not specific to the dynamic configuration). Values are produced by
// getExtraConf.
type configuration struct {
Enable bool // <prefix>.enable is the corresponding label; falls back to ExposedByDefault when the label is absent.
Canary bool // <prefix>.nomad.canary is the corresponding label; false when the label is absent.
}
2022-09-19 16:26:08 +02:00
// ProviderBuilder is responsible for constructing namespaced instances of the Nomad provider.
// It embeds the Configuration that is copied into every Provider it builds.
type ProviderBuilder struct {
Configuration ` yaml:",inline" export:"true" `
// Namespaces lists the Nomad namespaces to discover services in. When it is
// empty, BuildProviders returns a single Provider with no namespace set.
Namespaces [ ] string ` description:"Sets the Nomad namespaces used to discover services." json:"namespaces,omitempty" toml:"namespaces,omitempty" yaml:"namespaces,omitempty" `
}
// BuildProviders returns the Provider instances described by the builder.
//
// With no namespace configured, the result is a single Provider named "nomad"
// whose namespace is left empty. Otherwise one Provider is returned per entry of
// Namespaces, in the same order, named "nomad-<namespace>". Every Provider
// receives its own copy of the builder's Configuration.
func (p *ProviderBuilder) BuildProviders() []*Provider {
	if len(p.Namespaces) == 0 {
		single := &Provider{
			Configuration: p.Configuration,
			name:          providerName,
		}
		return []*Provider{single}
	}

	built := make([]*Provider, len(p.Namespaces))
	for idx, ns := range p.Namespaces {
		built[idx] = &Provider{
			Configuration: p.Configuration,
			name:          providerName + "-" + ns,
			namespace:     ns,
		}
	}

	return built
}
// Configuration represents the Nomad provider configuration.
type Configuration struct {
2024-04-04 05:54:04 -04:00
DefaultRule string ` description:"Default rule." json:"defaultRule,omitempty" toml:"defaultRule,omitempty" yaml:"defaultRule,omitempty" `
Constraints string ` description:"Constraints is an expression that Traefik matches against the Nomad service's tags to determine whether to create route(s) for that service." json:"constraints,omitempty" toml:"constraints,omitempty" yaml:"constraints,omitempty" export:"true" `
Endpoint * EndpointConfig ` description:"Nomad endpoint settings" json:"endpoint,omitempty" toml:"endpoint,omitempty" yaml:"endpoint,omitempty" export:"true" `
Prefix string ` description:"Prefix for nomad service tags." json:"prefix,omitempty" toml:"prefix,omitempty" yaml:"prefix,omitempty" export:"true" `
Stale bool ` description:"Use stale consistency for catalog reads." json:"stale,omitempty" toml:"stale,omitempty" yaml:"stale,omitempty" export:"true" `
ExposedByDefault bool ` description:"Expose Nomad services by default." json:"exposedByDefault,omitempty" toml:"exposedByDefault,omitempty" yaml:"exposedByDefault,omitempty" export:"true" `
RefreshInterval ptypes . Duration ` description:"Interval for polling Nomad API." json:"refreshInterval,omitempty" toml:"refreshInterval,omitempty" yaml:"refreshInterval,omitempty" export:"true" `
AllowEmptyServices bool ` description:"Allow the creation of services without endpoints." json:"allowEmptyServices,omitempty" toml:"allowEmptyServices,omitempty" yaml:"allowEmptyServices,omitempty" export:"true" `
2022-09-19 16:26:08 +02:00
}
// SetDefaults sets the default values for the Nomad Traefik Provider Configuration.
func ( c * Configuration ) SetDefaults ( ) {
2023-03-21 12:00:46 +01:00
defConfig := api . DefaultConfig ( )
c . Endpoint = & EndpointConfig {
Address : defConfig . Address ,
Region : defConfig . Region ,
Token : defConfig . SecretID ,
2023-03-21 16:51:10 +01:00
}
if defConfig . TLSConfig != nil && ( defConfig . TLSConfig . Insecure || defConfig . TLSConfig . CACert != "" || defConfig . TLSConfig . ClientCert != "" || defConfig . TLSConfig . ClientKey != "" ) {
c . Endpoint . TLS = & types . ClientTLS {
2023-03-21 12:00:46 +01:00
CA : defConfig . TLSConfig . CACert ,
Cert : defConfig . TLSConfig . ClientCert ,
Key : defConfig . TLSConfig . ClientKey ,
InsecureSkipVerify : defConfig . TLSConfig . Insecure ,
2023-03-21 16:51:10 +01:00
}
2023-03-21 12:00:46 +01:00
}
2023-03-21 16:51:10 +01:00
2022-09-19 16:26:08 +02:00
c . Prefix = defaultPrefix
c . ExposedByDefault = true
c . RefreshInterval = ptypes . Duration ( 15 * time . Second )
c . DefaultRule = defaultTemplateRule
2024-04-04 05:54:04 -04:00
c . AllowEmptyServices = false
2022-09-19 16:26:08 +02:00
}
2022-06-10 11:32:08 -05:00
type EndpointConfig struct {
2023-03-20 17:44:05 +08:00
// Address is the Nomad endpoint address, if empty it defaults to NOMAD_ADDR or "http://127.0.0.1:4646".
2022-06-10 11:32:08 -05:00
Address string ` description:"The address of the Nomad server, including scheme and port." json:"address,omitempty" toml:"address,omitempty" yaml:"address,omitempty" `
2023-03-20 17:44:05 +08:00
// Region is the Nomad region, if empty it defaults to NOMAD_REGION.
2022-06-10 11:32:08 -05:00
Region string ` description:"Nomad region to use. If not provided, the local agent region is used." json:"region,omitempty" toml:"region,omitempty" yaml:"region,omitempty" `
// Token is the ACL token to connect with Nomad, if empty it defaults to NOMAD_TOKEN.
Token string ` description:"Token is used to provide a per-request ACL token." json:"token,omitempty" toml:"token,omitempty" yaml:"token,omitempty" loggable:"false" `
TLS * types . ClientTLS ` description:"Configure TLS." json:"tls,omitempty" toml:"tls,omitempty" yaml:"tls,omitempty" export:"true" `
EndpointWaitTime ptypes . Duration ` description:"WaitTime limits how long a Watch will block. If not provided, the agent default values will be used" json:"endpointWaitTime,omitempty" toml:"endpointWaitTime,omitempty" yaml:"endpointWaitTime,omitempty" export:"true" `
}
2022-09-19 16:26:08 +02:00
// Provider holds configuration along with the namespace it will discover services in.
type Provider struct {
Configuration
name string
namespace string
2022-06-10 11:32:08 -05:00
client * api . Client // client for Nomad API
defaultRuleTpl * template . Template // default routing rule
}
// SetDefaults sets the default values for the Nomad Traefik Provider.
func ( p * Provider ) SetDefaults ( ) {
2023-03-21 15:50:06 +01:00
p . Configuration . SetDefaults ( )
2022-06-10 11:32:08 -05:00
}
// Init the Nomad Traefik Provider.
func ( p * Provider ) Init ( ) error {
2022-09-19 16:26:08 +02:00
if p . namespace == api . AllNamespacesNamespace {
return errors . New ( "wildcard namespace not supported" )
}
2022-06-10 11:32:08 -05:00
defaultRuleTpl , err := provider . MakeDefaultRuleTemplate ( p . DefaultRule , nil )
if err != nil {
return fmt . Errorf ( "error while parsing default rule: %w" , err )
}
p . defaultRuleTpl = defaultRuleTpl
2022-09-19 16:26:08 +02:00
// In case they didn't initialize Provider with BuildProviders
if p . name == "" {
p . name = providerName
}
2022-06-10 11:32:08 -05:00
return nil
}
// Provide allows the Nomad Traefik Provider to provide configurations to traefik
// using the given configuration channel.
func ( p * Provider ) Provide ( configurationChan chan <- dynamic . Message , pool * safe . Pool ) error {
var err error
2022-09-19 16:26:08 +02:00
p . client , err = createClient ( p . namespace , p . Endpoint )
2022-06-10 11:32:08 -05:00
if err != nil {
return fmt . Errorf ( "failed to create nomad API client: %w" , err )
}
pool . GoCtx ( func ( routineCtx context . Context ) {
2022-11-21 18:36:05 +01:00
logger := log . Ctx ( routineCtx ) . With ( ) . Str ( logs . ProviderName , p . name ) . Logger ( )
ctxLog := logger . WithContext ( routineCtx )
2022-06-10 11:32:08 -05:00
operation := func ( ) error {
ctx , cancel := context . WithCancel ( ctxLog )
defer cancel ( )
// load initial configuration
if err := p . loadConfiguration ( ctx , configurationChan ) ; err != nil {
return fmt . Errorf ( "failed to load initial nomad services: %w" , err )
}
// issue periodic refreshes in the background
// (Nomad does not support Watch style observations)
ticker := time . NewTicker ( time . Duration ( p . RefreshInterval ) )
defer ticker . Stop ( )
// enter loop where we wait for and respond to notifications
for {
select {
case <- ctx . Done ( ) :
return nil
case <- ticker . C :
}
// load services due to refresh
if err := p . loadConfiguration ( ctx , configurationChan ) ; err != nil {
return fmt . Errorf ( "failed to refresh nomad services: %w" , err )
}
}
}
failure := func ( err error , d time . Duration ) {
2022-11-21 18:36:05 +01:00
logger . Error ( ) . Err ( err ) . Msgf ( "Provider connection error, retrying in %s" , d )
2022-06-10 11:32:08 -05:00
}
if retryErr := backoff . RetryNotify (
safe . OperationWithRecover ( operation ) ,
backoff . WithContext ( job . NewBackOff ( backoff . NewExponentialBackOff ( ) ) , ctxLog ) ,
failure ,
) ; retryErr != nil {
2022-11-21 18:36:05 +01:00
logger . Error ( ) . Err ( retryErr ) . Msg ( "Cannot connect to Nomad server" )
2022-06-10 11:32:08 -05:00
}
} )
return nil
}
func ( p * Provider ) loadConfiguration ( ctx context . Context , configurationC chan <- dynamic . Message ) error {
2024-04-04 05:54:04 -04:00
var items [ ] item
var err error
if p . AllowEmptyServices {
items , err = p . getNomadServiceDataWithEmptyServices ( ctx )
if err != nil {
return err
}
} else {
items , err = p . getNomadServiceData ( ctx )
if err != nil {
return err
}
2022-06-10 11:32:08 -05:00
}
2024-04-04 05:54:04 -04:00
2022-06-10 11:32:08 -05:00
configurationC <- dynamic . Message {
2022-09-19 16:26:08 +02:00
ProviderName : p . name ,
2022-06-10 11:32:08 -05:00
Configuration : p . buildConfig ( ctx , items ) ,
}
return nil
}
func ( p * Provider ) getNomadServiceData ( ctx context . Context ) ( [ ] item , error ) {
// first, get list of service stubs
opts := & api . QueryOptions { AllowStale : p . Stale }
opts = opts . WithContext ( ctx )
stubs , _ , err := p . client . Services ( ) . List ( opts )
if err != nil {
return nil , err
}
var items [ ] item
for _ , stub := range stubs {
for _ , service := range stub . Services {
2022-11-21 18:36:05 +01:00
logger := log . Ctx ( ctx ) . With ( ) . Str ( "serviceName" , service . ServiceName ) . Logger ( )
2022-06-10 11:32:08 -05:00
2022-08-01 17:52:08 +02:00
extraConf := p . getExtraConf ( service . Tags )
if ! extraConf . Enable {
2022-11-21 18:36:05 +01:00
logger . Debug ( ) . Msg ( "Filter Nomad service that is not enabled" )
2022-06-10 11:32:08 -05:00
continue
}
matches , err := constraints . MatchTags ( service . Tags , p . Constraints )
if err != nil {
2022-11-21 18:36:05 +01:00
logger . Error ( ) . Err ( err ) . Msg ( "Error matching constraint expressions" )
2022-06-10 11:32:08 -05:00
continue
}
if ! matches {
2022-11-21 18:36:05 +01:00
logger . Debug ( ) . Msgf ( "Filter Nomad service not matching constraints: %q" , p . Constraints )
2022-06-10 11:32:08 -05:00
continue
}
instances , err := p . fetchService ( ctx , service . ServiceName )
if err != nil {
return nil , err
}
for _ , i := range instances {
items = append ( items , item {
ID : i . ID ,
Name : i . ServiceName ,
Namespace : i . Namespace ,
Node : i . NodeID ,
Datacenter : i . Datacenter ,
Address : i . Address ,
Port : i . Port ,
Tags : i . Tags ,
2022-08-01 17:52:08 +02:00
ExtraConf : p . getExtraConf ( i . Tags ) ,
2022-06-10 11:32:08 -05:00
} )
}
}
}
return items , nil
}
2024-04-04 05:54:04 -04:00
// getNomadServiceDataWithEmptyServices builds the item list from job
// definitions instead of the service catalog, so that services of task groups
// scaled down to zero are still reported. The Nomad service interface does not
// currently return such services, see
// https://github.com/hashicorp/nomad/issues/19731.
//
// Every listed job is fetched in full, and the services declared on each task
// group and on each of its tasks are considered. A service is skipped when it is
// not enabled or when its tags do not match p.Constraints. For a task group
// that has an enabled scaling policy and a count of zero, one placeholder item
// is emitted per service (empty node, datacenter and address, port -1, and an
// ID synthesized from the namespace, job, group, task and service names). For
// any other task group the registered instances are resolved through
// fetchService, one item per instance.
//
// An API error aborts the collection and is returned. An error while evaluating
// the constraint expression is logged and only skips the affected service.
func (p *Provider) getNomadServiceDataWithEmptyServices(ctx context.Context) ([]item, error) {
	// The same options serve the job listing and every job lookup, so that the
	// Stale setting is honored consistently for all reads.
	opts := (&api.QueryOptions{AllowStale: p.Stale}).WithContext(ctx)

	jobStubs, _, err := p.client.Jobs().List(opts)
	if err != nil {
		return nil, err
	}

	// deref reads an optional string field of the API payload without
	// panicking when the field was left unset.
	deref := func(s *string) string {
		if s == nil {
			return ""
		}
		return *s
	}

	var items []item

	for _, jobStub := range jobStubs {
		// Named jobInfo to avoid shadowing the imported job package.
		jobInfo, _, err := p.client.Jobs().Info(jobStub.ID, opts)
		if err != nil {
			return nil, err
		}

		for _, taskGroup := range jobInfo.TaskGroups {
			// Evaluated once per group: a group is treated as scaled to zero
			// only when scaling is explicitly enabled and the count is
			// explicitly 0. Unset (nil) values are treated as "not scaled to zero".
			scaledToZero := taskGroup.Scaling != nil &&
				taskGroup.Scaling.Enabled != nil && *taskGroup.Scaling.Enabled &&
				taskGroup.Count != nil && *taskGroup.Count == 0

			// Services can be declared on the group itself or on any of its tasks.
			services := make([]*api.Service, 0, len(taskGroup.Services))
			services = append(services, taskGroup.Services...)
			for _, task := range taskGroup.Tasks {
				services = append(services, task.Services...)
			}

			for _, service := range services {
				logger := log.Ctx(ctx).With().Str("serviceName", service.Name).Logger()

				extraConf := p.getExtraConf(service.Tags)
				if !extraConf.Enable {
					logger.Debug().Msg("Filter Nomad service that is not enabled")
					continue
				}

				matches, err := constraints.MatchTags(service.Tags, p.Constraints)
				if err != nil {
					logger.Error().Err(err).Msg("Error matching constraint expressions")
					continue
				}

				if !matches {
					logger.Debug().Msgf("Filter Nomad service not matching constraints: %q", p.Constraints)
					continue
				}

				if scaledToZero {
					namespace := deref(jobInfo.Namespace)

					// Add a placeholder item without address for the unregistered service.
					items = append(items, item{
						// Create a unique id for non registered services
						ID:         fmt.Sprintf("%s-%s-%s-%s-%s", namespace, deref(jobInfo.Name), deref(taskGroup.Name), service.TaskName, service.Name),
						Name:       service.Name,
						Namespace:  namespace,
						Node:       "",
						Datacenter: "",
						Address:    "",
						Port:       -1,
						Tags:       service.Tags,
						ExtraConf:  extraConf,
					})

					continue
				}

				instances, err := p.fetchService(ctx, service.Name)
				if err != nil {
					return nil, err
				}

				for _, i := range instances {
					items = append(items, item{
						ID:         i.ID,
						Name:       i.ServiceName,
						Namespace:  i.Namespace,
						Node:       i.NodeID,
						Datacenter: i.Datacenter,
						Address:    i.Address,
						Port:       i.Port,
						Tags:       i.Tags,
						ExtraConf:  p.getExtraConf(i.Tags),
					})
				}
			}
		}
	}

	return items, nil
}
2023-03-22 12:00:25 +01:00
// getExtraConf extracts from tags the settings that are not part of the dynamic
// configuration (e.g. "<prefix>.enable").
//
// Enable defaults to ExposedByDefault and Canary to false; each is overridden
// when the matching label is present, a value equal to "true" (case-insensitive)
// meaning true and anything else meaning false.
//
// NOTE(review): the labels are looked up under the fixed "traefik." prefix, so
// this presumably relies on tagsToLabels (defined outside this view) rewriting
// p.Prefix to "traefik" - confirm.
func (p *Provider) getExtraConf(tags []string) configuration {
	labels := tagsToLabels(tags, p.Prefix)

	conf := configuration{Enable: p.ExposedByDefault}

	if raw, ok := labels["traefik.enable"]; ok {
		conf.Enable = strings.EqualFold(raw, "true")
	}

	if raw, ok := labels["traefik.nomad.canary"]; ok {
		conf.Canary = strings.EqualFold(raw, "true")
	}

	return conf
}
2022-06-10 11:32:08 -05:00
// fetchService queries the Nomad API for the registrations of the service
// called name. When services are not exposed by default, the query is
// restricted to registrations whose tags contain "<prefix>.enable=true".
// The query honors the Stale setting and is bound to ctx. Any API error is
// returned wrapped.
func (p *Provider) fetchService(ctx context.Context, name string) ([]*api.ServiceRegistration, error) {
	query := &api.QueryOptions{AllowStale: p.Stale}
	if !p.ExposedByDefault {
		query.Filter = fmt.Sprintf(` Tags contains %q `, p.Prefix+".enable=true")
	}
	query = query.WithContext(ctx)

	// TODO: Nomad currently (v1.3.0) does not support health checks,
	//  and as such does not yet return health status information.
	//  When it does, refactor this section to include health status.
	registrations, _, err := p.client.Services().Get(name, query)
	if err != nil {
		return nil, fmt.Errorf("failed to fetch services: %w", err)
	}

	return registrations, nil
}
2023-03-22 12:00:25 +01:00
// createClient builds a Nomad API client for the given namespace from the
// endpoint settings (address, region, token and wait time). The TLS section is
// forwarded only when endpoint.TLS is set. endpoint itself must not be nil.
func createClient(namespace string, endpoint *EndpointConfig) (*api.Client, error) {
	clientConfig := &api.Config{
		Address:   endpoint.Address,
		Namespace: namespace,
		Region:    endpoint.Region,
		SecretID:  endpoint.Token,
		WaitTime:  time.Duration(endpoint.EndpointWaitTime),
	}

	if tls := endpoint.TLS; tls != nil {
		clientConfig.TLSConfig = &api.TLSConfig{
			CACert:     tls.CA,
			ClientCert: tls.Cert,
			ClientKey:  tls.Key,
			Insecure:   tls.InsecureSkipVerify,
		}
	}

	return api.NewClient(clientConfig)
}