|
| 1 | +package beholder |
| 2 | + |
| 3 | +import ( |
| 4 | + "context" |
| 5 | + "fmt" |
| 6 | + "time" |
| 7 | + |
| 8 | + "go.opentelemetry.io/otel/attribute" |
| 9 | + "go.opentelemetry.io/otel/metric" |
| 10 | + "go.opentelemetry.io/otel/trace" |
| 11 | + "google.golang.org/protobuf/proto" |
| 12 | + |
| 13 | + "github.com/smartcontractkit/chainlink-common/pkg/beholder/pb" |
| 14 | + "github.com/smartcontractkit/chainlink-common/pkg/config/build" |
| 15 | + "github.com/smartcontractkit/chainlink-common/pkg/logger" |
| 16 | + "github.com/smartcontractkit/chainlink-common/pkg/services" |
| 17 | + "github.com/smartcontractkit/chainlink-common/pkg/timeutil" |
| 18 | +) |
| 19 | + |
| 20 | +// Heartbeat represents a periodic heartbeat service that emits metrics and logs |
| 21 | +type Heartbeat struct { |
| 22 | + services.Service |
| 23 | + eng *services.Engine |
| 24 | + |
| 25 | + beat time.Duration |
| 26 | + emitter Emitter |
| 27 | + meter metric.Meter |
| 28 | + logger logger.Logger |
| 29 | + tracer trace.Tracer |
| 30 | + appID string |
| 31 | + serviceName string |
| 32 | + version string |
| 33 | + commit string |
| 34 | + labels map[string]string |
| 35 | +} |
| 36 | + |
| 37 | +// NewHeartbeat creates a new heartbeat service with custom configuration |
| 38 | +func NewHeartbeat(beat time.Duration, lggr logger.Logger, opts ...HeartbeatOpt) *Heartbeat { |
| 39 | + // Setup default emitter, meter, and tracer |
| 40 | + noopClient := NewNoopClient() |
| 41 | + |
| 42 | + // Create heartbeat with defaults |
| 43 | + h := &Heartbeat{ |
| 44 | + beat: beat, |
| 45 | + logger: lggr, |
| 46 | + emitter: noopClient.Emitter, |
| 47 | + meter: noopClient.Meter, |
| 48 | + tracer: noopClient.Tracer, |
| 49 | + appID: "chainlink", // Default app ID |
| 50 | + serviceName: build.Program, // Default service name |
| 51 | + version: build.Version, // Use build version |
| 52 | + commit: build.ChecksumPrefix, // Use build commit |
| 53 | + labels: make(map[string]string), |
| 54 | + } |
| 55 | + |
| 56 | + // Apply options |
| 57 | + for _, opt := range opts { |
| 58 | + opt(h) |
| 59 | + } |
| 60 | + |
| 61 | + // Build labels from current values |
| 62 | + h.labels = map[string]string{ |
| 63 | + "service": h.serviceName, |
| 64 | + "version": h.version, |
| 65 | + "commit": h.commit, |
| 66 | + } |
| 67 | + if h.appID != "" { |
| 68 | + h.labels["app_id"] = h.appID |
| 69 | + } |
| 70 | + |
| 71 | + // Create service engine |
| 72 | + h.Service, h.eng = services.Config{ |
| 73 | + Name: "BeholderHeartbeat", |
| 74 | + Start: h.start, |
| 75 | + }.NewServiceEngine(lggr) |
| 76 | + |
| 77 | + return h |
| 78 | +} |
| 79 | + |
| 80 | +// HeartbeatOpt is a functional option for configuring the heartbeat |
| 81 | +type HeartbeatOpt func(*Heartbeat) |
| 82 | + |
| 83 | +// WithEmitter sets a custom message emitter for the heartbeat |
| 84 | +func WithEmitter(emitter Emitter) HeartbeatOpt { |
| 85 | + return func(h *Heartbeat) { |
| 86 | + h.emitter = emitter |
| 87 | + } |
| 88 | +} |
| 89 | + |
| 90 | +// WithMeter sets a custom meter for the heartbeat |
| 91 | +func WithMeter(meter metric.Meter) HeartbeatOpt { |
| 92 | + return func(h *Heartbeat) { |
| 93 | + h.meter = meter |
| 94 | + } |
| 95 | +} |
| 96 | + |
| 97 | +// WithTracer sets a custom tracer for the heartbeat |
| 98 | +func WithTracer(tracer trace.Tracer) HeartbeatOpt { |
| 99 | + return func(h *Heartbeat) { |
| 100 | + h.tracer = tracer |
| 101 | + } |
| 102 | +} |
| 103 | + |
| 104 | +// WithAppID sets a custom app ID for the heartbeat |
| 105 | +func WithAppID(appID string) HeartbeatOpt { |
| 106 | + return func(h *Heartbeat) { |
| 107 | + h.appID = appID |
| 108 | + if appID != "" { |
| 109 | + h.labels["app_id"] = appID |
| 110 | + } else { |
| 111 | + delete(h.labels, "app_id") |
| 112 | + } |
| 113 | + } |
| 114 | +} |
| 115 | + |
| 116 | +// WithServiceName sets a custom service name for the heartbeat |
| 117 | +func WithServiceName(serviceName string) HeartbeatOpt { |
| 118 | + return func(h *Heartbeat) { |
| 119 | + h.serviceName = serviceName |
| 120 | + h.labels["service"] = serviceName |
| 121 | + } |
| 122 | +} |
| 123 | + |
| 124 | +// WithVersion sets a custom version for the heartbeat |
| 125 | +func WithVersion(version string) HeartbeatOpt { |
| 126 | + return func(h *Heartbeat) { |
| 127 | + h.version = version |
| 128 | + h.labels["version"] = version |
| 129 | + } |
| 130 | +} |
| 131 | + |
| 132 | +// WithCommit sets a custom commit for the heartbeat |
| 133 | +func WithCommit(commit string) HeartbeatOpt { |
| 134 | + return func(h *Heartbeat) { |
| 135 | + h.commit = commit |
| 136 | + h.labels["commit"] = commit |
| 137 | + } |
| 138 | +} |
| 139 | + |
| 140 | +// WithBeatInterval sets a custom beat interval for the heartbeat |
| 141 | +func WithBeatInterval(beat time.Duration) HeartbeatOpt { |
| 142 | + return func(h *Heartbeat) { |
| 143 | + h.beat = beat |
| 144 | + } |
| 145 | +} |
| 146 | + |
| 147 | +// start initializes and starts the heartbeat service |
| 148 | +func (h *Heartbeat) start(ctx context.Context) error { |
| 149 | + // Create heartbeat metrics |
| 150 | + heartbeatGauge, err := h.meter.Int64Gauge("beholder_heartbeat") |
| 151 | + if err != nil { |
| 152 | + return fmt.Errorf("failed to create heartbeat status gauge: %w", err) |
| 153 | + } |
| 154 | + |
| 155 | + heartbeatCount, err := h.meter.Int64Counter("beholder_heartbeat_count") |
| 156 | + if err != nil { |
| 157 | + return fmt.Errorf("failed to create heartbeat counter: %w", err) |
| 158 | + } |
| 159 | + |
| 160 | + // Define the heartbeat function |
| 161 | + beatFn := func(ctx context.Context) { |
| 162 | + start := time.Now() |
| 163 | + |
| 164 | + // Create a trace span for the heartbeat |
| 165 | + ctx, span := h.tracer.Start(ctx, "beholder_heartbeat", trace.WithAttributes( |
| 166 | + attribute.String("service", h.serviceName), |
| 167 | + attribute.String("app_id", h.appID), |
| 168 | + attribute.String("version", h.version), |
| 169 | + attribute.String("commit", h.commit), |
| 170 | + )) |
| 171 | + defer span.End() |
| 172 | + |
| 173 | + // Record heartbeat metrics |
| 174 | + heartbeatGauge.Record(ctx, 1) |
| 175 | + heartbeatCount.Add(ctx, 1) |
| 176 | + |
| 177 | + // Emit heartbeat message |
| 178 | + |
| 179 | + payload := &pb.BaseMessage{ |
| 180 | + Msg: "beholder heartbeat", |
| 181 | + Labels: h.labels, |
| 182 | + } |
| 183 | + payloadBytes, err := proto.Marshal(payload) |
| 184 | + if err != nil { |
| 185 | + // log error |
| 186 | + h.logger.Errorw("heartbeat marshal protobuf failed", "err", err) |
| 187 | + } |
| 188 | + |
| 189 | + err = h.emitter.Emit(ctx, payloadBytes, |
| 190 | + AttrKeyDataSchema, "/beholder-base-message/versions/1", // required |
| 191 | + AttrKeyDomain, "platform", // required |
| 192 | + AttrKeyEntity, "BaseMessage", // required |
| 193 | + "service", h.serviceName, |
| 194 | + "app_id", h.appID, |
| 195 | + "version", h.version, |
| 196 | + "commit", h.commit, |
| 197 | + "timestamp", start.Unix(), |
| 198 | + ) |
| 199 | + |
| 200 | + if err != nil { |
| 201 | + h.logger.Errorw("heartbeat emit failed", "err", err) |
| 202 | + } |
| 203 | + |
| 204 | + // Log heartbeat |
| 205 | + h.logger.Debugw("beholder heartbeat emitted", |
| 206 | + "service", h.serviceName, |
| 207 | + "app_id", h.appID, |
| 208 | + "version", h.version, |
| 209 | + "commit", h.commit, |
| 210 | + "timestamp", start.Unix(), |
| 211 | + ) |
| 212 | + } |
| 213 | + |
| 214 | + // Start the heartbeat ticker |
| 215 | + // Execute immediately first, then continue with regular intervals |
| 216 | + h.eng.Go(func(ctx context.Context) { |
| 217 | + beatFn(ctx) |
| 218 | + }) |
| 219 | + h.eng.GoTick(timeutil.NewTicker(h.GetBeat), beatFn) |
| 220 | + |
| 221 | + h.logger.Infow("beholder heartbeat service started", |
| 222 | + "service", h.serviceName, |
| 223 | + "beat_interval", h.GetBeat(), |
| 224 | + ) |
| 225 | + |
| 226 | + return nil |
| 227 | +} |
| 228 | + |
| 229 | +// GetBeat returns the heartbeat interval |
| 230 | +func (h *Heartbeat) GetBeat() time.Duration { |
| 231 | + return h.beat |
| 232 | +} |
| 233 | + |
| 234 | +// GetAppID returns the app ID |
| 235 | +func (h *Heartbeat) GetAppID() string { |
| 236 | + return h.appID |
| 237 | +} |
| 238 | + |
| 239 | +// GetServiceName returns the service name |
| 240 | +func (h *Heartbeat) GetServiceName() string { |
| 241 | + return h.serviceName |
| 242 | +} |
| 243 | + |
| 244 | +// GetVersion returns the version |
| 245 | +func (h *Heartbeat) GetVersion() string { |
| 246 | + return h.version |
| 247 | +} |
| 248 | + |
| 249 | +// GetCommit returns the commit |
| 250 | +func (h *Heartbeat) GetCommit() string { |
| 251 | + return h.commit |
| 252 | +} |
| 253 | + |
| 254 | +// GetLabels returns the labels |
| 255 | +func (h *Heartbeat) GetLabels() map[string]string { |
| 256 | + return h.labels |
| 257 | +} |
| 258 | + |
| 259 | +// GetEmitter returns the message emitter |
| 260 | +func (h *Heartbeat) GetEmitter() Emitter { |
| 261 | + return h.emitter |
| 262 | +} |
| 263 | + |
| 264 | +// GetMeter returns the meter |
| 265 | +func (h *Heartbeat) GetMeter() metric.Meter { |
| 266 | + return h.meter |
| 267 | +} |
| 268 | + |
| 269 | +// GetLogger returns the logger |
| 270 | +func (h *Heartbeat) GetLogger() logger.Logger { |
| 271 | + return h.logger |
| 272 | +} |
| 273 | + |
| 274 | +// GetTracer returns the tracer |
| 275 | +func (h *Heartbeat) GetTracer() trace.Tracer { |
| 276 | + return h.tracer |
| 277 | +} |
0 commit comments