Files
pgsql-broker/pkg/broker/database_instance.go

327 lines
7.9 KiB
Go

package broker
import (
"context"
"encoding/json"
"fmt"
"os"
"sync"
"time"
"git.warky.dev/wdevs/pgsql-broker/pkg/broker/adapter"
"git.warky.dev/wdevs/pgsql-broker/pkg/broker/config"
"git.warky.dev/wdevs/pgsql-broker/pkg/broker/models"
"git.warky.dev/wdevs/pgsql-broker/pkg/broker/queue"
)
// DatabaseInstance represents a broker instance for a single database
type DatabaseInstance struct {
ID int64
Name string
DatabaseName string
Hostname string
PID int
Version string
config *config.Config
dbConfig *config.DatabaseConfig
db adapter.DBAdapter
logger adapter.Logger
queues map[int]*queue.Queue
queuesMu sync.RWMutex
ctx context.Context
shutdown bool
shutdownMu sync.RWMutex
jobsHandled int64
startTime time.Time
}
// NewDatabaseInstance creates a new database instance
func NewDatabaseInstance(cfg *config.Config, dbCfg *config.DatabaseConfig, db adapter.DBAdapter, logger adapter.Logger, version string, parentCtx context.Context) (*DatabaseInstance, error) {
hostname, err := os.Hostname()
if err != nil {
hostname = "unknown"
}
instance := &DatabaseInstance{
Name: fmt.Sprintf("%s-%s", cfg.Broker.Name, dbCfg.Name),
DatabaseName: dbCfg.Name,
Hostname: hostname,
PID: os.Getpid(),
Version: version,
config: cfg,
dbConfig: dbCfg,
db: db,
logger: logger.With("component", "database-instance").With("database", dbCfg.Name),
queues: make(map[int]*queue.Queue),
ctx: parentCtx,
startTime: time.Now(),
}
return instance, nil
}
// Start begins the database instance
func (i *DatabaseInstance) Start() error {
i.logger.Info("starting database instance", "name", i.Name, "hostname", i.Hostname, "pid", i.PID)
// Connect to database
if err := i.db.Connect(i.ctx); err != nil {
return fmt.Errorf("failed to connect to database: %w", err)
}
// Register instance in database
if err := i.registerInstance(); err != nil {
return fmt.Errorf("failed to register instance: %w", err)
}
i.logger.Info("database instance registered", "id", i.ID)
// Start queues
if err := i.startQueues(); err != nil {
return fmt.Errorf("failed to start queues: %w", err)
}
// Start listening for notifications
if err := i.startListener(); err != nil {
return fmt.Errorf("failed to start listener: %w", err)
}
// Start ping routine
go i.pingRoutine()
i.logger.Info("database instance started successfully")
return nil
}
// Stop gracefully stops the database instance
func (i *DatabaseInstance) Stop() error {
i.shutdownMu.Lock()
if i.shutdown {
i.shutdownMu.Unlock()
return nil
}
i.shutdown = true
i.shutdownMu.Unlock()
i.logger.Info("stopping database instance")
// Stop all queues
i.queuesMu.Lock()
for num, q := range i.queues {
i.logger.Info("stopping queue", "number", num)
if err := q.Stop(); err != nil {
i.logger.Error("failed to stop queue", "number", num, "error", err)
}
}
i.queuesMu.Unlock()
// Update instance status in database
if err := i.shutdownInstance(); err != nil {
i.logger.Error("failed to shutdown instance in database", "error", err)
}
// Close database connection
if err := i.db.Close(); err != nil {
i.logger.Error("failed to close database", "error", err)
}
i.logger.Info("database instance stopped")
return nil
}
// registerInstance registers the instance in the database
func (i *DatabaseInstance) registerInstance() error {
var retval int
var errmsg string
var instanceID int64
err := i.db.QueryRow(i.ctx,
"SELECT p_retval, p_errmsg, p_instance_id FROM broker_register_instance($1, $2, $3, $4, $5)",
i.Name, i.Hostname, i.PID, i.Version, i.dbConfig.QueueCount,
).Scan(&retval, &errmsg, &instanceID)
if err != nil {
return fmt.Errorf("query error: %w", err)
}
if retval > 0 {
return fmt.Errorf("broker_register_instance error: %s", errmsg)
}
i.ID = instanceID
return nil
}
// startQueues initializes and starts all queues
func (i *DatabaseInstance) startQueues() error {
i.queuesMu.Lock()
defer i.queuesMu.Unlock()
for queueNum := 1; queueNum <= i.dbConfig.QueueCount; queueNum++ {
queueCfg := queue.Config{
Number: queueNum,
InstanceID: i.ID,
WorkerCount: 1, // One worker per queue for now
DBAdapter: i.db,
Logger: i.logger,
BufferSize: i.config.Broker.QueueBufferSize,
TimerSeconds: i.config.Broker.QueueTimerSec,
FetchSize: i.config.Broker.FetchQueryQueSize,
}
q := queue.New(queueCfg)
if err := q.Start(queueCfg); err != nil {
return fmt.Errorf("failed to start queue %d: %w", queueNum, err)
}
i.queues[queueNum] = q
i.logger.Info("queue started", "number", queueNum)
}
return nil
}
// startListener starts listening for database notifications
func (i *DatabaseInstance) startListener() error {
handler := func(n *adapter.Notification) {
i.handleNotification(n)
}
if err := i.db.Listen(i.ctx, "broker.event", handler); err != nil {
return fmt.Errorf("failed to start listener: %w", err)
}
return nil
}
// handleNotification processes incoming job notifications
func (i *DatabaseInstance) handleNotification(n *adapter.Notification) {
if i.config.Broker.EnableDebug {
i.logger.Debug("received notification", "channel", n.Channel, "payload", n.Payload)
}
var job models.Job
if err := json.Unmarshal([]byte(n.Payload), &job); err != nil {
i.logger.Error("failed to unmarshal notification", "error", err, "payload", n.Payload)
return
}
if job.ID <= 0 {
i.logger.Warn("notification missing job ID", "payload", n.Payload)
return
}
if job.JobQueue <= 0 {
i.logger.Warn("notification missing queue number", "job_id", job.ID)
return
}
// Get the queue
i.queuesMu.RLock()
q, exists := i.queues[job.JobQueue]
i.queuesMu.RUnlock()
if !exists {
i.logger.Warn("queue not found for job", "job_id", job.ID, "queue", job.JobQueue)
return
}
// Add job to queue
if err := q.AddJob(job); err != nil {
i.logger.Error("failed to add job to queue", "job_id", job.ID, "queue", job.JobQueue, "error", err)
}
}
// pingRoutine periodically updates the instance status in the database
func (i *DatabaseInstance) pingRoutine() {
ticker := time.NewTicker(30 * time.Second)
defer ticker.Stop()
for {
select {
case <-ticker.C:
i.shutdownMu.RLock()
if i.shutdown {
i.shutdownMu.RUnlock()
return
}
i.shutdownMu.RUnlock()
if err := i.ping(); err != nil {
i.logger.Error("ping failed", "error", err)
}
case <-i.ctx.Done():
return
}
}
}
// ping updates the instance ping timestamp
func (i *DatabaseInstance) ping() error {
var retval int
var errmsg string
err := i.db.QueryRow(i.ctx,
"SELECT p_retval, p_errmsg FROM broker_ping_instance($1, $2)",
i.ID, i.jobsHandled,
).Scan(&retval, &errmsg)
if err != nil {
return fmt.Errorf("query error: %w", err)
}
if retval > 0 {
return fmt.Errorf("broker_ping_instance error: %s", errmsg)
}
return nil
}
// shutdownInstance marks the instance as shutdown in the database
func (i *DatabaseInstance) shutdownInstance() error {
var retval int
var errmsg string
err := i.db.QueryRow(i.ctx,
"SELECT p_retval, p_errmsg FROM broker_shutdown_instance($1)",
i.ID,
).Scan(&retval, &errmsg)
if err != nil {
return fmt.Errorf("query error: %w", err)
}
if retval > 0 {
return fmt.Errorf("broker_shutdown_instance error: %s", errmsg)
}
return nil
}
// GetStats returns instance statistics
func (i *DatabaseInstance) GetStats() map[string]interface{} {
i.queuesMu.RLock()
defer i.queuesMu.RUnlock()
stats := map[string]interface{}{
"id": i.ID,
"name": i.Name,
"database_name": i.DatabaseName,
"hostname": i.Hostname,
"pid": i.PID,
"version": i.Version,
"uptime": time.Since(i.startTime).String(),
"jobs_handled": i.jobsHandled,
"queue_count": len(i.queues),
}
queueStats := make(map[int]interface{})
for num, q := range i.queues {
queueStats[num] = q.GetStats()
}
stats["queues"] = queueStats
return stats
}