package consul import ( "fmt" "time" "github.com/armon/go-metrics" "github.com/armon/go-metrics/prometheus" "github.com/hashicorp/consul/acl" "github.com/hashicorp/consul/agent/structs" ) var SessionGauges = []prometheus.GaugeDefinition{ { Name: []string{"session_ttl", "active"}, Help: "Tracks the active number of sessions being tracked.", }, { Name: []string{"raft", "applied_index"}, Help: "Represents the raft applied index.", }, { Name: []string{"raft", "last_index"}, Help: "Represents the raft last index.", }, } var SessionSummaries = []prometheus.SummaryDefinition{ { Name: []string{"session_ttl", "invalidate"}, Help: "Measures the time spent invalidating an expired session.", }, } const ( // maxInvalidateAttempts limits how many invalidate attempts are made maxInvalidateAttempts = 6 // invalidateRetryBase is a baseline retry time invalidateRetryBase = 10 * time.Second ) // initializeSessionTimers is used when a leader is newly elected to create // a new map to track session expiration and to reset all the timers from // the previously known set of timers. func (s *Server) initializeSessionTimers() error { // Scan all sessions and reset their timer state := s.fsm.State() _, sessions, err := state.SessionListAll(nil) if err != nil { return err } for _, session := range sessions { if err := s.resetSessionTimer(session); err != nil { return err } } return nil } // resetSessionTimer is used to renew the TTL of a session. // This can be used for new sessions and existing ones. A session // will be faulted in if not given. func (s *Server) resetSessionTimer(session *structs.Session) error { // Bail if the session has no TTL, fast-path some common inputs switch session.TTL { case "", "0", "0s", "0m", "0h": return nil } // Parse the TTL, and skip if zero time ttl, err := time.ParseDuration(session.TTL) if err != nil { return fmt.Errorf("Invalid Session TTL '%s': %v", session.TTL, err) } if ttl == 0 { return nil } s.createSessionTimer(session.ID, ttl, &session.EnterpriseMeta) return nil } func (s *Server) createSessionTimer(id string, ttl time.Duration, entMeta *acl.EnterpriseMeta) { // Reset the session timer // Adjust the given TTL by the TTL multiplier. This is done // to give a client a grace period and to compensate for network // and processing delays. The contract is that a session is not expired // before the TTL, but there is no explicit promise about the upper // bound so this is allowable. ttl = ttl * structs.SessionTTLMultiplier s.sessionTimers.ResetOrCreate(id, ttl, func() { s.invalidateSession(id, entMeta) }) } // invalidateSession is invoked when a session TTL is reached and we // need to invalidate the session. func (s *Server) invalidateSession(id string, entMeta *acl.EnterpriseMeta) { defer metrics.MeasureSince([]string{"session_ttl", "invalidate"}, time.Now()) // Clear the session timer s.sessionTimers.Del(id) // Create a session destroy request args := structs.SessionRequest{ Datacenter: s.config.Datacenter, Op: structs.SessionDestroy, Session: structs.Session{ ID: id, }, } if entMeta != nil { args.Session.EnterpriseMeta = *entMeta } // Retry with exponential backoff to invalidate the session for attempt := uint(0); attempt < maxInvalidateAttempts; attempt++ { // TODO(rpc-metrics-improv): Double check request name here _, err := s.leaderRaftApply("Session.Check", structs.SessionRequestType, args) if err == nil { s.logger.Debug("Session TTL expired", "session", id) return } s.logger.Error("Invalidation failed", "error", err) time.Sleep((1 << attempt) * invalidateRetryBase) } s.logger.Error("maximum revoke attempts reached for session", "error", id) } // clearSessionTimer is used to clear the session time for // a single session. This is used when a session is destroyed // explicitly and no longer needed. func (s *Server) clearSessionTimer(id string) error { s.sessionTimers.Stop(id) return nil } // clearAllSessionTimers is used when a leader is stepping // down and we no longer need to track any session timers. func (s *Server) clearAllSessionTimers() { s.sessionTimers.StopAll() } // updateMetrics is a long running routine used to update a // number of server periodic metrics func (s *Server) updateMetrics() { for { select { case <-time.After(time.Second): metrics.SetGauge([]string{"session_ttl", "active"}, float32(s.sessionTimers.Len())) metrics.SetGauge([]string{"raft", "applied_index"}, float32(s.raft.AppliedIndex())) metrics.SetGauge([]string{"raft", "last_index"}, float32(s.raft.LastIndex())) case <-s.shutdownCh: return } } }