|
1 | 1 | package main |
2 | 2 |
|
3 | 3 | import ( |
| 4 | + "context" |
4 | 5 | "os" |
| 6 | + "os/signal" |
| 7 | + "sync" |
| 8 | + "syscall" |
5 | 9 | "time" |
6 | 10 |
|
7 | 11 | "github.com/threatwinds/go-sdk/catcher" |
8 | 12 | "github.com/utmstack/UTMStack/agent-manager/agent" |
9 | 13 | "github.com/utmstack/UTMStack/agent-manager/database" |
| 14 | + "github.com/utmstack/UTMStack/agent-manager/recovery" |
10 | 15 | "github.com/utmstack/UTMStack/agent-manager/updates" |
11 | 16 | ) |
12 | 17 |
|
| 18 | +type recoveryProvider struct { |
| 19 | + server *agent.AgentService |
| 20 | + lastSeenServ *agent.LastSeenService |
| 21 | +} |
| 22 | + |
| 23 | +func (p *recoveryProvider) GetStream(agentID uint) (recovery.AgentStream, bool) { |
| 24 | + p.server.AgentStreamMutex.Lock() |
| 25 | + defer p.server.AgentStreamMutex.Unlock() |
| 26 | + s, ok := p.server.AgentStreamMap[agentID] |
| 27 | + if !ok { |
| 28 | + return nil, false |
| 29 | + } |
| 30 | + return s, true |
| 31 | +} |
| 32 | + |
| 33 | +func (p *recoveryProvider) IsOnline(agentID uint) bool { |
| 34 | + if p.lastSeenServ == nil { |
| 35 | + return false |
| 36 | + } |
| 37 | + st, _, err := p.lastSeenServ.GetLastSeenStatus(agentID, "agent") |
| 38 | + if err != nil { |
| 39 | + return false |
| 40 | + } |
| 41 | + return st == agent.Status_ONLINE |
| 42 | +} |
| 43 | + |
13 | 44 | func main() { |
14 | 45 | catcher.Info("Starting Agent Manager", map[string]any{"process": "agent-manager"}) |
15 | 46 |
|
16 | | - err := database.MigrateDatabase() |
17 | | - if err != nil { |
| 47 | + ctx, stop := signal.NotifyContext(context.Background(), syscall.SIGTERM, syscall.SIGINT) |
| 48 | + defer stop() |
| 49 | + |
| 50 | + if err := database.MigrateDatabase(); err != nil { |
18 | 51 | _ = catcher.Error("failed to migrate database", err, map[string]any{"process": "agent-manager"}) |
19 | 52 | time.Sleep(5 * time.Second) |
20 | 53 | os.Exit(1) |
21 | 54 | } |
22 | 55 |
|
| 56 | + if err := agent.InitAgentService(); err != nil { |
| 57 | + _ = catcher.Error("failed to init agent service", err, map[string]any{"process": "agent-manager"}) |
| 58 | + time.Sleep(5 * time.Second) |
| 59 | + os.Exit(1) |
| 60 | + } |
| 61 | + |
| 62 | + go agent.InitCollectorService() |
| 63 | + agent.InitLastSeenService() |
| 64 | + |
| 65 | + recovery.SetStreamProvider(&recoveryProvider{ |
| 66 | + server: agent.AgentServ, |
| 67 | + lastSeenServ: agent.LastSeenServ, |
| 68 | + }) |
| 69 | + agent.RegisterRecoveryHooks( |
| 70 | + recovery.OnAgentConnect, |
| 71 | + recovery.OnAgentRegister, |
| 72 | + recovery.OnAgentUpdate, |
| 73 | + recovery.OnCommandResult, |
| 74 | + func(agentID uint) sync.Locker { return recovery.StreamMutex.For(agentID) }, |
| 75 | + ) |
| 76 | + if err := recovery.Init(ctx, database.GetDB().GormDB()); err != nil { |
| 77 | + _ = catcher.Error("failed to init recovery", err, map[string]any{"process": "agent-manager"}) |
| 78 | + } |
| 79 | + |
23 | 80 | go updates.InitUpdatesManager() |
24 | | - agent.InitGrpcServer() |
| 81 | + go agent.StartGrpcServer() |
| 82 | + |
| 83 | + <-ctx.Done() |
| 84 | + catcher.Info("Shutdown signal received; draining recovery dispatches", map[string]any{"process": "agent-manager"}) |
| 85 | + if err := recovery.Shutdown(15 * time.Second); err != nil { |
| 86 | + _ = catcher.Error("recovery shutdown error", err, map[string]any{"process": "agent-manager"}) |
| 87 | + } |
| 88 | + catcher.Info("Agent Manager shut down cleanly", map[string]any{"process": "agent-manager"}) |
25 | 89 | } |
0 commit comments