// Files
// sendico/api/pkg/discovery/service.go
// 2026-01-06 17:51:35 +01:00
//
// 371 lines
// 11 KiB
// Go

package discovery
import (
"context"
"encoding/json"
"strings"
"sync"
"time"
"github.com/nats-io/nats.go"
"github.com/tech/sendico/pkg/merrors"
msg "github.com/tech/sendico/pkg/messaging"
mb "github.com/tech/sendico/pkg/messaging/broker"
cons "github.com/tech/sendico/pkg/messaging/consumer"
me "github.com/tech/sendico/pkg/messaging/envelope"
"github.com/tech/sendico/pkg/mlogger"
"go.uber.org/zap"
)
// RegistryOption customises a RegistryService while NewRegistryService is
// building it. Options are applied in the order they are passed.
type RegistryOption func(*RegistryService)
// WithRegistryKVTTL returns an option that appends WithKVTTL(ttl) to the KV
// store options held by the service. Applying the option to a nil service is
// a no-op.
func WithRegistryKVTTL(ttl time.Duration) RegistryOption {
	return func(s *RegistryService) {
		if s != nil {
			s.kvOptions = append(s.kvOptions, WithKVTTL(ttl))
		}
	}
}
// RegistryService keeps a Registry up to date from discovery announce and
// heartbeat messages, answers lookup requests, and, when a KV store is
// available, persists entries to it and applies changes observed through a
// KV watch.
type RegistryService struct {
// logger is the logger passed to NewRegistryService, named
// "discovery_registry".
logger mlogger.Logger
// registry is the in-memory registry updated by the message handlers and
// by the KV watch loop.
registry *Registry
// producer publishes lookup responses and refresh events. It may be nil,
// in which case lookups are ignored and refresh events are not sent.
producer msg.Producer
// sender is the sender name passed to the envelope constructors; it
// defaults to "discovery" when the caller supplies a blank value.
sender string
// consumers holds one consumer/handler pair per subscribed event.
consumers []consumerHandler
// kv is the KV store used for persistence; nil when KV is disabled.
kv *KVStore
// kvWatcher is set by startKVWatch and stopped by Stop.
kvWatcher nats.KeyWatcher
// kvOptions are collected from RegistryOptions and passed to NewKVStore.
kvOptions []KVStoreOption
// startOnce and stopOnce make the bodies of Start and Stop run at most
// once each.
startOnce sync.Once
stopOnce sync.Once
}
// consumerHandler pairs a message consumer with the handler it feeds and the
// event name used when logging about that consumer.
type consumerHandler struct {
// consumer is the subscription the handler is attached to in Start.
consumer msg.Consumer
// handler is passed to consumer.ConsumeMessages.
handler msg.MessageHandlerT
// event is the string form of the subscribed event, used in log fields.
event string
}
// NewRegistryService builds a RegistryService with consumers for the service
// announce, gateway announce, heartbeat and lookup request events.
//
// msgBroker and logger are required; a nil value for either yields an
// InvalidArgument error. A nil registry is replaced with NewRegistry(), and a
// sender that is blank after trimming defaults to "discovery". producer may
// be nil: lookup requests are then ignored and refresh events are not
// published. Nil entries in opts are skipped.
//
// If creating any consumer fails, the consumers created before it are closed
// before the error is returned, so a failed construction does not leave them
// behind. Failure to initialise the KV store is not fatal; the service is
// returned with KV disabled.
func NewRegistryService(logger mlogger.Logger, msgBroker mb.Broker, producer msg.Producer, registry *Registry, sender string, opts ...RegistryOption) (*RegistryService, error) {
	if msgBroker == nil {
		return nil, merrors.InvalidArgument("discovery registry: broker is nil", "broker")
	}
	if logger == nil {
		return nil, merrors.InvalidArgument("discovery registry: no logger provided", "logger")
	}
	if registry == nil {
		registry = NewRegistry()
	}
	logger = logger.Named("discovery_registry")
	sender = strings.TrimSpace(sender)
	if sender == "" {
		sender = "discovery"
	}

	// Track every consumer created so far so that a failure part-way through
	// closes them instead of abandoning them.
	var created []msg.Consumer
	ready := false
	defer func() {
		if ready {
			return
		}
		for _, c := range created {
			c.Close()
		}
	}()

	serviceConsumer, err := cons.NewConsumer(logger, msgBroker, ServiceAnnounceEvent())
	if err != nil {
		return nil, err
	}
	created = append(created, serviceConsumer)

	gatewayConsumer, err := cons.NewConsumer(logger, msgBroker, GatewayAnnounceEvent())
	if err != nil {
		return nil, err
	}
	created = append(created, gatewayConsumer)

	heartbeatConsumer, err := cons.NewConsumer(logger, msgBroker, HeartbeatEvent())
	if err != nil {
		return nil, err
	}
	created = append(created, heartbeatConsumer)

	lookupConsumer, err := cons.NewConsumer(logger, msgBroker, LookupRequestEvent())
	if err != nil {
		return nil, err
	}

	svc := &RegistryService{
		logger:   logger,
		registry: registry,
		producer: producer,
		sender:   sender,
	}
	for _, opt := range opts {
		if opt != nil {
			opt(svc)
		}
	}

	// Both announce events share one handler.
	svc.consumers = []consumerHandler{
		{consumer: serviceConsumer, event: ServiceAnnounceEvent().ToString(), handler: svc.handleAnnounce},
		{consumer: gatewayConsumer, event: GatewayAnnounceEvent().ToString(), handler: svc.handleAnnounce},
		{consumer: heartbeatConsumer, event: HeartbeatEvent().ToString(), handler: svc.handleHeartbeat},
		{consumer: lookupConsumer, event: LookupRequestEvent().ToString(), handler: svc.handleLookup},
	}

	// Options must be applied before this point: initKV reads svc.kvOptions.
	svc.initKV(msgBroker)

	ready = true
	return svc, nil
}
// Start launches one goroutine per configured consumer and then starts the KV
// watch. The body runs at most once; later calls, and calls on a nil
// receiver, do nothing.
func (s *RegistryService) Start() {
	if s == nil {
		return
	}
	s.startOnce.Do(func() {
		kvEnabled := s.kv != nil
		startFields := []zap.Field{
			zap.Int("consumers", len(s.consumers)),
			zap.Bool("kv_enabled", kvEnabled),
		}
		if kvEnabled {
			if name := s.kv.Bucket(); name != "" {
				startFields = append(startFields, zap.String("kv_bucket", name))
			}
		}
		s.logInfo("Discovery registry service starting", startFields...)

		for i := range s.consumers {
			// Pass the pair by value so each goroutine works on its own copy.
			go func(h consumerHandler) {
				err := h.consumer.ConsumeMessages(h.handler)
				if err == nil {
					return
				}
				s.logger.Warn("Discovery consumer stopped with error", zap.String("event", h.event), zap.Error(err))
			}(s.consumers[i])
		}

		s.startKVWatch()
	})
}
// Stop closes every non-nil consumer and stops the KV watcher if one was
// started. The body runs at most once; later calls, and calls on a nil
// receiver, do nothing.
//
// A failure to stop the KV watcher is logged as a warning rather than
// discarded; shutdown still completes.
func (s *RegistryService) Stop() {
	if s == nil {
		return
	}
	s.stopOnce.Do(func() {
		for _, ch := range s.consumers {
			if ch.consumer != nil {
				ch.consumer.Close()
			}
		}
		if s.kvWatcher != nil {
			if err := s.kvWatcher.Stop(); err != nil {
				s.logWarn("Failed to stop discovery KV watch", zap.Error(err))
			}
		}
		s.logInfo("Discovery registry service stopped")
	})
}
// handleAnnounce decodes an Announcement from the envelope, upserts it into
// the registry, persists the resulting entry, and publishes a refresh event
// when the entry is new or has just become healthy.
//
// A decode failure is logged and returned. An announcement with neither an ID
// nor an instance ID is logged and dropped without error; one missing only
// the instance ID is logged but still processed.
func (s *RegistryService) handleAnnounce(_ context.Context, env me.Envelope) error {
	var announcement Announcement
	if err := json.Unmarshal(env.GetData(), &announcement); err != nil {
		s.logWarn("Failed to decode discovery announce payload",
			append(envelopeFields(env), zap.Int("data_len", len(env.GetData())), zap.Error(err))...)
		return err
	}

	// describe builds the envelope + announcement log fields on demand.
	describe := func() []zap.Field {
		return append(envelopeFields(env), announcementFields(announcement)...)
	}
	s.logDebug("Discovery announce received", describe()...)

	if strings.TrimSpace(announcement.InstanceID) == "" {
		if strings.TrimSpace(announcement.ID) == "" {
			s.logWarn("Discovery announce missing id and instance id", describe()...)
			return nil
		}
		s.logWarn("Discovery announce missing instance id", describe()...)
	}

	outcome := s.registry.UpsertFromAnnouncement(announcement, time.Now())
	s.persistEntry(outcome.Entry)
	if !outcome.IsNew && !outcome.BecameHealthy {
		return nil
	}

	changeFields := append(entryFields(outcome.Entry),
		zap.Bool("is_new", outcome.IsNew),
		zap.Bool("became_healthy", outcome.BecameHealthy))
	s.logInfo("Discovery registry entry updated", changeFields...)
	s.publishRefresh(outcome.Entry)
	return nil
}
// handleHeartbeat decodes a Heartbeat from the envelope and applies it to the
// registry. Every entry the registry reports back is persisted, and a refresh
// event is published for each one that has just become healthy.
//
// A decode failure is logged and returned. A heartbeat with neither an ID nor
// an instance ID is dropped silently; one missing only the instance ID is
// logged but still processed. A non-positive payload timestamp is replaced
// with the current time.
func (s *RegistryService) handleHeartbeat(_ context.Context, env me.Envelope) error {
	var beat Heartbeat
	if err := json.Unmarshal(env.GetData(), &beat); err != nil {
		s.logWarn("Failed to decode discovery heartbeat payload",
			append(envelopeFields(env), zap.Int("data_len", len(env.GetData())), zap.Error(err))...)
		return err
	}
	s.logDebug("Discovery heartbeat received",
		append(envelopeFields(env),
			zap.String("id", beat.ID),
			zap.String("instance_id", beat.InstanceID),
			zap.String("status", beat.Status))...)

	if strings.TrimSpace(beat.InstanceID) == "" {
		if strings.TrimSpace(beat.ID) == "" {
			return nil
		}
		s.logWarn("Discovery heartbeat missing instance id",
			append(envelopeFields(env), zap.String("id", beat.ID))...)
	}

	reportedAt := time.Unix(beat.TS, 0)
	if reportedAt.Unix() <= 0 {
		reportedAt = time.Now()
	}

	updates := s.registry.UpdateHeartbeat(beat.ID, beat.InstanceID, strings.TrimSpace(beat.Status), reportedAt, time.Now())
	if len(updates) == 0 {
		s.logDebug("Discovery heartbeat ignored: entry not found",
			zap.String("id", beat.ID), zap.String("instance_id", beat.InstanceID))
		return nil
	}

	for _, update := range updates {
		if update.BecameHealthy {
			s.logInfo("Discovery registry entry became healthy",
				append(entryFields(update.Entry), zap.String("status", update.Entry.Status))...)
			s.publishRefresh(update.Entry)
		}
		s.persistEntry(update.Entry)
	}
	return nil
}
// handleLookup answers a lookup request with the registry's current lookup
// result, echoing back the trimmed request ID.
//
// When no producer is configured the request is logged and ignored without
// error. Decode and publish failures are logged and returned.
func (s *RegistryService) handleLookup(_ context.Context, env me.Envelope) error {
	if s.producer == nil {
		s.logWarn("Discovery lookup request ignored: producer not configured", envelopeFields(env)...)
		return nil
	}

	var request LookupRequest
	if err := json.Unmarshal(env.GetData(), &request); err != nil {
		s.logWarn("Failed to decode discovery lookup payload",
			append(envelopeFields(env), zap.Int("data_len", len(env.GetData())), zap.Error(err))...)
		return err
	}

	resp := s.registry.Lookup(time.Now())
	resp.RequestID = strings.TrimSpace(request.RequestID)
	s.logDebug("Discovery lookup prepared",
		zap.String("request_id", resp.RequestID),
		zap.Int("services", len(resp.Services)),
		zap.Int("gateways", len(resp.Gateways)))

	err := s.producer.SendMessage(NewLookupResponseEnvelope(s.sender, resp))
	if err == nil {
		return nil
	}
	s.logWarn("Failed to publish discovery lookup response",
		zap.String("request_id", resp.RequestID), zap.Error(err))
	return err
}
// publishRefresh sends a refresh event describing entry through the producer.
// It does nothing when the receiver or the producer is nil; a send failure is
// logged as a warning and not returned.
func (s *RegistryService) publishRefresh(entry RegistryEntry) {
	if s == nil || s.producer == nil {
		return
	}

	envelope := NewRefreshUIEnvelope(s.sender, RefreshEvent{
		InstanceID: entry.InstanceID,
		Service:    entry.Service,
		Rail:       entry.Rail,
		Network:    entry.Network,
		Message:    "new module available",
	})
	err := s.producer.SendMessage(envelope)
	if err == nil {
		return
	}
	s.logWarn("Failed to publish discovery refresh event", append(entryFields(entry), zap.Error(err))...)
}
// jetStreamProvider is implemented by brokers that can hand out a JetStream
// context. initKV type-asserts the broker against it to decide whether the KV
// store can be enabled.
type jetStreamProvider interface {
JetStream() nats.JetStreamContext
}
// initKV tries to attach a KV store to the service. s.kv is left nil, with a
// log line explaining why, when the broker does not implement
// jetStreamProvider, when it returns a nil JetStream context, or when
// NewKVStore fails.
func (s *RegistryService) initKV(msgBroker mb.Broker) {
	if s == nil || msgBroker == nil {
		return
	}

	var js nats.JetStreamContext
	if provider, supported := msgBroker.(jetStreamProvider); supported {
		js = provider.JetStream()
	} else {
		s.logInfo("Discovery KV disabled: broker does not support JetStream")
		return
	}
	if js == nil {
		s.logWarn("Discovery KV disabled: JetStream not configured")
		return
	}

	kvStore, err := NewKVStore(s.logger, js, "", s.kvOptions...)
	if err != nil {
		s.logWarn("Failed to initialise discovery KV store", zap.Error(err))
		return
	}
	s.kv = kvStore
}
// startKVWatch obtains a watcher from s.kv.WatchAll(), records it on the
// service so Stop can stop it, and starts consumeKVUpdates in a goroutine.
// It does nothing when KV is disabled and only logs a warning when the watch
// cannot be created.
func (s *RegistryService) startKVWatch() {
	if s == nil || s.kv == nil {
		return
	}

	w, err := s.kv.WatchAll()
	if err != nil {
		s.logWarn("Failed to start discovery KV watch", zap.Error(err))
		return
	}
	s.kvWatcher = w

	// The start message is only emitted when the bucket name is known.
	if name := s.kv.Bucket(); name != "" {
		s.logInfo("Discovery KV watch started", zap.String("bucket", name))
	}

	go s.consumeKVUpdates(w)
}
// consumeKVUpdates applies KV watch updates to the registry until the
// watcher's update channel is closed.
//
// The first nil update is treated as the end of the initial sync and is
// logged together with the number of put entries seen so far; later nil
// updates are ignored. Delete and purge operations remove the matching
// registry entry. Put operations are decoded as a RegistryEntry and upserted,
// publishing a refresh event when the entry is new or has just become
// healthy. Any other operation is skipped.
func (s *RegistryService) consumeKVUpdates(watcher nats.KeyWatcher) {
	if s == nil || watcher == nil {
		return
	}

	syncing := true
	seenDuringSync := 0

	for update := range watcher.Updates() {
		if update == nil {
			if syncing {
				syncing = false
				doneFields := []zap.Field{zap.Int("entries", seenDuringSync)}
				if s.kv != nil {
					if name := s.kv.Bucket(); name != "" {
						doneFields = append(doneFields, zap.String("bucket", name))
					}
				}
				s.logInfo("Discovery KV initial sync complete", doneFields...)
			}
			continue
		}

		op := update.Operation()
		if op == nats.KeyValueDelete || op == nats.KeyValuePurge {
			if key := registryKeyFromKVKey(update.Key()); key != "" && s.registry.Delete(key) {
				s.logInfo("Discovery registry entry removed", zap.String("key", key))
			}
			continue
		}
		if op != nats.KeyValuePut {
			continue
		}
		if syncing {
			seenDuringSync++
		}

		var stored RegistryEntry
		if err := json.Unmarshal(update.Value(), &stored); err != nil {
			s.logWarn("Failed to decode discovery KV entry", zap.String("key", update.Key()), zap.Error(err))
			continue
		}

		outcome := s.registry.UpsertEntry(stored, time.Now())
		if !outcome.IsNew && !outcome.BecameHealthy {
			continue
		}
		s.logInfo("Discovery registry entry updated from KV",
			append(entryFields(outcome.Entry),
				zap.Bool("is_new", outcome.IsNew),
				zap.Bool("became_healthy", outcome.BecameHealthy))...)
		s.publishRefresh(outcome.Entry)
	}
}
// persistEntry writes entry to the KV store when one is configured. A write
// failure is logged as a warning and not returned.
func (s *RegistryService) persistEntry(entry RegistryEntry) {
	if s == nil || s.kv == nil {
		return
	}
	err := s.kv.Put(entry)
	if err == nil {
		return
	}
	s.logWarn("Failed to persist discovery entry", append(entryFields(entry), zap.Error(err))...)
}
// logWarn forwards a warning to the service logger; it is a no-op on a nil
// receiver.
func (s *RegistryService) logWarn(message string, fields ...zap.Field) {
	if s != nil {
		s.logger.Warn(message, fields...)
	}
}
// logDebug forwards a debug message to the service logger; it is a no-op on a
// nil receiver.
func (s *RegistryService) logDebug(message string, fields ...zap.Field) {
	if s != nil {
		s.logger.Debug(message, fields...)
	}
}
// logInfo forwards an informational message to the service logger; it is a
// no-op on a nil receiver.
func (s *RegistryService) logInfo(message string, fields ...zap.Field) {
	if s != nil {
		s.logger.Info(message, fields...)
	}
}