apollo-backend/cmd/apollo-scheduler/main.go

227 lines
5 KiB
Go
Raw Normal View History

2021-07-08 23:03:46 +00:00
package main
import (
"context"
"fmt"
"log"
"os"
"os/signal"
"syscall"
"time"
2021-07-09 02:09:14 +00:00
"github.com/DataDog/datadog-go/statsd"
2021-07-08 23:03:46 +00:00
"github.com/adjust/rmq/v4"
"github.com/go-co-op/gocron"
"github.com/go-redis/redis/v8"
"github.com/jackc/pgx/v4"
"github.com/jackc/pgx/v4/pgxpool"
"github.com/joho/godotenv"
"github.com/sirupsen/logrus"
)
func main() {
_ = godotenv.Load()
errChan := make(chan error, 10)
go logErrors(errChan)
ctx, cancel := context.WithCancel(context.Background())
var logger *logrus.Logger
{
logger = logrus.New()
if os.Getenv("ENV") == "" {
logger.SetLevel(logrus.DebugLevel)
} else {
logger.SetFormatter(&logrus.TextFormatter{
DisableColors: true,
FullTimestamp: true,
})
}
}
2021-07-09 02:09:14 +00:00
statsd, err := statsd.New("127.0.0.1:8125")
if err != nil {
logger.WithFields(logrus.Fields{
"err": err,
}).Error("failed to set up stats")
}
2021-07-08 23:03:46 +00:00
// Set up Postgres connection
var pool *pgxpool.Pool
{
config, err := pgxpool.ParseConfig(os.Getenv("DATABASE_CONNECTION_POOL_URL"))
if err != nil {
panic(err)
}
// Setting the build statement cache to nil helps this work with pgbouncer
config.ConnConfig.BuildStatementCache = nil
config.ConnConfig.PreferSimpleProtocol = true
pool, err = pgxpool.ConnectConfig(ctx, config)
if err != nil {
panic(err)
}
defer pool.Close()
}
// Set up Redis connection
var redisConn *redis.Client
{
2021-07-08 23:26:15 +00:00
opt, err := redis.ParseURL(os.Getenv("REDISCLOUD_URL"))
if err != nil {
panic(err)
}
2021-07-08 23:03:46 +00:00
2021-07-08 23:26:15 +00:00
redisConn = redis.NewClient(opt)
2021-07-08 23:03:46 +00:00
if err := redisConn.Ping(ctx).Err(); err != nil {
panic(err)
}
}
// Set up queues
var (
notificationsQueue rmq.Queue
)
{
connection, err := rmq.OpenConnectionWithRedisClient("producer", redisConn, errChan)
if err != nil {
panic(err)
}
notificationsQueue, err = connection.OpenQueue("notifications")
if err != nil {
panic(err)
}
}
s := gocron.NewScheduler(time.UTC)
2021-07-09 02:09:14 +00:00
s.Every(1).Second().Do(func() { enqueueAccounts(ctx, logger, statsd, pool, redisConn, notificationsQueue) })
2021-07-08 23:03:46 +00:00
s.StartAsync()
signals := make(chan os.Signal, 1)
2021-07-09 01:07:01 +00:00
signal.Notify(signals, syscall.SIGINT, syscall.SIGTERM)
2021-07-08 23:03:46 +00:00
defer signal.Stop(signals)
<-signals // wait for signal
cancel()
go func() {
<-signals // hard exit on second signal (in case shutdown gets stuck)
os.Exit(1)
}()
s.Stop()
}
2021-07-09 02:09:14 +00:00
func enqueueAccounts(ctx context.Context, logger *logrus.Logger, statsd *statsd.Client, pool *pgxpool.Pool, redisConn *redis.Client, queue rmq.Queue) {
2021-07-09 02:15:28 +00:00
start := time.Now()
2021-07-09 01:07:01 +00:00
now := float64(time.Now().UnixNano()/int64(time.Millisecond)) / 1000
2021-07-09 02:09:14 +00:00
// Start looking for accounts that were last checked at least 5 seconds ago
// and at most 6 seconds ago. Also look for accounts that haven't been checked
// in over a minute.
2021-07-09 02:15:28 +00:00
ts := start.Unix()
left := ts - 6
right := left + 1
2021-07-09 02:09:14 +00:00
expired := ts - 60
2021-07-09 00:53:09 +00:00
2021-07-08 23:03:46 +00:00
ids := []int64{}
err := pool.BeginFunc(ctx, func(tx pgx.Tx) error {
stmt := `
WITH account AS (
SELECT id
FROM accounts
2021-07-09 01:01:45 +00:00
WHERE
2021-07-09 02:09:14 +00:00
last_checked_at BETWEEN $1 AND $2
OR last_checked_at < $3
ORDER BY last_checked_at
2021-07-08 23:03:46 +00:00
)
UPDATE accounts
2021-07-09 02:09:14 +00:00
SET last_enqueued_at = $4
2021-07-08 23:03:46 +00:00
WHERE accounts.id IN(SELECT id FROM account)
RETURNING accounts.id`
2021-07-09 02:15:28 +00:00
rows, err := tx.Query(ctx, stmt, left, right, expired, now)
2021-07-08 23:03:46 +00:00
if err != nil {
return err
}
defer rows.Close()
for rows.Next() {
var id int64
rows.Scan(&id)
ids = append(ids, id)
}
return nil
})
if err != nil {
logger.WithFields(logrus.Fields{
"err": err,
}).Error("failed to fetch batch of accounts")
return
}
logger.WithFields(logrus.Fields{
"count": len(ids),
2021-07-09 02:15:28 +00:00
"start": left,
"end": right,
2021-07-08 23:03:46 +00:00
}).Debug("enqueueing account batch")
2021-07-09 00:17:20 +00:00
enqueued := 0
2021-07-09 00:26:01 +00:00
skipped := 0
2021-07-09 02:09:14 +00:00
failed := 0
2021-07-08 23:03:46 +00:00
for _, id := range ids {
payload := fmt.Sprintf("%d", id)
2021-07-09 01:44:06 +00:00
lockKey := fmt.Sprintf("locks:accounts:%s", payload)
_, err := redisConn.Get(ctx, lockKey).Result()
2021-07-09 01:50:45 +00:00
if err == nil {
2021-07-09 00:26:01 +00:00
skipped++
2021-07-08 23:03:46 +00:00
continue
2021-07-09 01:50:45 +00:00
} else if err != redis.Nil {
2021-07-09 01:44:06 +00:00
logger.WithFields(logrus.Fields{
"lockKey": lockKey,
"err": err,
}).Error("failed to check for account lock")
2021-07-08 23:03:46 +00:00
}
2021-07-09 00:26:01 +00:00
2021-07-09 01:44:06 +00:00
if err := redisConn.SetEX(ctx, lockKey, true, 60*time.Second).Err(); err != nil {
2021-07-09 00:26:01 +00:00
logger.WithFields(logrus.Fields{
2021-07-09 01:44:06 +00:00
"lockKey": lockKey,
"err": err,
2021-07-09 00:26:01 +00:00
}).Error("failed to lock account")
}
2021-07-09 02:09:14 +00:00
if err = queue.Publish(payload); err != nil {
logger.WithFields(logrus.Fields{
"accountID": payload,
"err": err,
}).Error("failed to enqueue account")
failed++
} else {
enqueued++
}
2021-07-08 23:03:46 +00:00
}
2021-07-09 02:09:14 +00:00
statsd.Histogram("apollo.queue.enqueued", float64(enqueued), []string{}, 1)
statsd.Histogram("apollo.queue.skipped", float64(skipped), []string{}, 1)
statsd.Histogram("apollo.queue.failed", float64(failed), []string{}, 1)
2021-07-09 02:15:28 +00:00
statsd.Histogram("apollo.queue.runtime", float64(time.Now().Sub(start).Milliseconds()), []string{}, 1)
2021-07-09 02:09:14 +00:00
2021-07-08 23:03:46 +00:00
logger.WithFields(logrus.Fields{
2021-07-09 00:26:01 +00:00
"count": enqueued,
"skipped": skipped,
2021-07-09 02:09:14 +00:00
"failed": failed,
2021-07-09 02:15:28 +00:00
"start": left,
"end": right,
2021-07-09 00:17:20 +00:00
}).Info("done enqueueing account batch")
2021-07-08 23:03:46 +00:00
}
func logErrors(errChan <-chan error) {
for err := range errChan {
log.Print("error: ", err)
}
}