block · alecthomas · Jan 20, 2026 · Jan 20, 2026
@@ -10,11 +10,15 @@ test:
 
 # Lint code
 lint:
-    golangci-lint run
-    actionlint
+    #!/bin/bash
+    # Run both linters in parallel. A bare `wait` always exits 0, so wait on
+    # each PID individually to propagate a lint failure to the caller.
+    golangci-lint run &
+    golangci_pid=$!
+    actionlint &
+    actionlint_pid=$!
+    status=0
+    wait "$golangci_pid" || status=1
+    wait "$actionlint_pid" || status=1
+    exit "$status"
 
 # Format code
 fmt:
-    just --unstable --fmt
-    golangci-lint fmt
-    go mod tidy
+    #!/bin/bash
+    # Run the formatters in parallel. A bare `wait` always exits 0, so collect
+    # the PIDs and wait on each one to report a failure from any of them.
+    pids=()
+    just --unstable --fmt &
+    pids+=($!)
+    golangci-lint fmt &
+    pids+=($!)
+    go mod tidy &
+    pids+=($!)
+    status=0
+    for pid in "${pids[@]}"; do
+        wait "$pid" || status=1
+    done
+    exit "$status"
@@ -1 +1 @@
-.golangci-lint-2.8.0.pkg
+.golangci-lint-2.7.2.pkg
@@ -11,6 +11,7 @@
 git {
   mirror-root = "./state/git-mirrors"
   clone-depth = 1000
+  bundle-interval = "24h"
 }
 
 host "https://w3.org" {}
@@ -20,8 +21,8 @@ github-releases {
   private-orgs = ["alecthomas"]
 }
 
-memory {}
-
 disk {
   root = "./state/cache"
+  limit-mb = 250000
+  max-ttl = "8h"
 }
@@ -0,0 +1,155 @@
+// Package jobscheduler provides a means to schedule work across multiple queues while limiting overall work.
+package jobscheduler
+
+import (
+	"context"
+	"fmt"
+	"runtime"
+	"sync"
+	"time"
+
+	"github.com/alecthomas/errors"
+
+	"github.com/block/cachew/internal/logging"
+)
+
+// Config holds the settings for the job scheduler.
+type Config struct {
+	// Concurrency is the maximum number of jobs run at once; New replaces 0 with runtime.NumCPU().
+	Concurrency int `hcl:"concurrency" help:"The maximum number of concurrent jobs to run (0 means number of cores)." default:"0"`
+}
+
+// queueJob is a single unit of work belonging to a named queue.
+type queueJob struct {
+	// id is the caller-supplied identifier; in this file it is only used to build the job's String form.
+	id    string
+	// queue is the name of the queue the job belongs to; jobs sharing a queue name are not run concurrently.
+	queue string
+	// run is the function executed for the job.
+	run   func(ctx context.Context) error
+}
+
+// String renders the job as "job-<queue>-<id>", which the workers use as the job's log label.
+func (j *queueJob) String() string {
+	label := fmt.Sprintf("job-%s-%s", j.queue, j.id)
+	return label
+}
+// Run executes the job's function with ctx and passes its result through errors.WithStack.
+func (j *queueJob) Run(ctx context.Context) error {
+	err := j.run(ctx)
+	return errors.WithStack(err)
+}
+
+// Scheduler accepts jobs that are grouped into named queues.
+type Scheduler interface {
+	// Submit hands run to the scheduler under the given queue name and job id.
+	Submit(queue, id string, run func(ctx context.Context) error)
+	// SubmitPeriodicJob hands run to the scheduler as a repeating job; RootScheduler runs it once and then
+	// resubmits it after each interval.
+	SubmitPeriodicJob(queue, id string, interval time.Duration, run func(ctx context.Context) error)
+}
+
+// PrefixedScheduler wraps another Scheduler and prepends a fixed prefix to every queue name before delegating.
+type PrefixedScheduler struct {
+	// prefix is prepended verbatim (no separator is added) to each queue name.
+	prefix    string
+	// scheduler is the Scheduler that actually receives the jobs.
+	scheduler Scheduler
+}
+
+// Submit forwards the job to the wrapped scheduler under the prefixed queue name.
+func (ps *PrefixedScheduler) Submit(queue, id string, run func(ctx context.Context) error) {
+	prefixed := ps.prefix + queue
+	ps.scheduler.Submit(prefixed, id, run)
+}
+
+// SubmitPeriodicJob forwards the periodic job to the wrapped scheduler under the prefixed queue name.
+func (ps *PrefixedScheduler) SubmitPeriodicJob(queue, id string, interval time.Duration, run func(ctx context.Context) error) {
+	prefixed := ps.prefix + queue
+	ps.scheduler.SubmitPeriodicJob(prefixed, id, interval, run)
+}
+
+// RootScheduler runs jobs from multiple queues.
+//
+// Its primary role is to rate limit concurrent background tasks so that we don't DoS the host when, for example,
+// generating git snapshots, GCing git repos, etc.
+type RootScheduler struct {
+	// workAvailable is a buffered wake-up channel: workers receive from it before scanning for a runnable job.
+	workAvailable chan bool
+	// lock guards queue and active.
+	lock          sync.Mutex
+	// queue holds pending jobs in submission order; workers scan it from the front.
+	queue         []queueJob
+	// active is the set of queue names that currently have a job running.
+	active        map[string]bool
+	// cancel cancels the context handed to the workers. NOTE(review): nothing in the visible code calls it.
+	cancel        context.CancelFunc
+}
+
+// Compile-time check that *RootScheduler satisfies Scheduler.
+var _ Scheduler = (*RootScheduler)(nil)
+
+// New creates a RootScheduler and starts its worker goroutines.
+//
+// config.Concurrency sets the number of workers; any non-positive value selects runtime.NumCPU(). The workers run
+// until ctx (or the scheduler's derived context) is cancelled.
+func New(ctx context.Context, config Config) Scheduler {
+	// Ranging over a negative count starts no workers at all, which would leave every submitted job queued
+	// forever, so treat all non-positive values as "use the number of cores".
+	if config.Concurrency <= 0 {
+		config.Concurrency = runtime.NumCPU()
+	}
+	q := &RootScheduler{
+		workAvailable: make(chan bool, 1024),
+		active:        make(map[string]bool),
+	}
+	ctx, cancel := context.WithCancel(ctx)
+	q.cancel = cancel
+	for id := range config.Concurrency {
+		go q.worker(ctx, id)
+	}
+	return q
+}
+
+// WithQueuePrefix returns a Scheduler that prepends prefix to the queue name of every job submitted through it.
+//
+// Giving each strategy its own prefix keeps their queue names from colliding.
+func (q *RootScheduler) WithQueuePrefix(prefix string) Scheduler {
+	prefixed := new(PrefixedScheduler)
+	prefixed.prefix = prefix
+	prefixed.scheduler = q
+	return prefixed
+}
+
+// Submit a job to the queue.
+//
+// Jobs run concurrently across queues, but never within a queue.
+//
+// Submit never blocks on the workers: the job is appended under the lock and the wake-up is best-effort.
+func (q *RootScheduler) Submit(queue, id string, run func(ctx context.Context) error) {
+	q.lock.Lock()
+	q.queue = append(q.queue, queueJob{queue: queue, id: id, run: run})
+	q.lock.Unlock()
+
+	// The channel only carries wake-up hints. Sending while holding the lock could deadlock once the buffer is
+	// full, because workers need the lock before they can drain it. If the buffer is full there are already
+	// plenty of pending wake-ups, so dropping this one is safe.
+	select {
+	case q.workAvailable <- true:
+	default:
+	}
+}
+
+// SubmitPeriodicJob submits a job to the queue that runs immediately, and then periodically after the interval.
+//
+// Jobs run concurrently across queues, but never within a queue.
+//
+// The interval is measured from the end of one run to the submission of the next. Rescheduling stops once the
+// context passed to the job is cancelled.
+func (q *RootScheduler) SubmitPeriodicJob(queue, description string, interval time.Duration, run func(ctx context.Context) error) {
+	q.Submit(queue, description, func(ctx context.Context) error {
+		err := run(ctx)
+		go func() {
+			// Wait for the interval, but give up on cancellation so this goroutine does not outlive the
+			// scheduler and keep queueing jobs that no worker will ever pick up.
+			timer := time.NewTimer(interval)
+			defer timer.Stop()
+			select {
+			case <-ctx.Done():
+				return
+			case <-timer.C:
+				q.SubmitPeriodicJob(queue, description, interval, run)
+			}
+		}()
+		return errors.WithStack(err)
+	})
+}
+
+// worker is the loop run by each scheduler goroutine.
+//
+// It waits for a wake-up on workAvailable, takes the next runnable job (if any), runs it, logs a failure, and then
+// releases the job's queue so that another job from the same queue may run. It returns when ctx is cancelled.
+func (q *RootScheduler) worker(ctx context.Context, id int) {
+	logger := logging.FromContext(ctx).With("scheduler-worker", id)
+	for {
+		select {
+		case <-ctx.Done():
+			logger.InfoContext(ctx, "Worker terminated")
+			return
+
+		case <-q.workAvailable:
+			job, ok := q.takeNextJob()
+			if !ok {
+				// Spurious wake-up: nothing queued, or every queued job belongs to a busy queue.
+				continue
+			}
+			jlogger := logger.With("job", job.String())
+			jlogger.InfoContext(ctx, "Running job")
+			if err := job.run(ctx); err != nil {
+				jlogger.ErrorContext(ctx, "Job failed", "error", err)
+			}
+			q.markQueueInactive(job.queue)
+			// The queue is free again, so wake a worker to look for jobs that were waiting on it. The send is
+			// non-blocking: if the buffer is full there are already pending wake-ups, and a blocking send here
+			// could stall every worker at once with nobody left to receive.
+			select {
+			case q.workAvailable <- true:
+			default:
+			}
+		}
+	}
+}
+
+// markQueueInactive records that the named queue no longer has a running job.
+func (q *RootScheduler) markQueueInactive(queue string) {
+	q.lock.Lock()
+	delete(q.active, queue)
+	q.lock.Unlock()
+}
+
+// takeNextJob removes and returns the first queued job whose queue is not already running a job, marking that
+// queue as active. It returns false if no such job exists.
+func (q *RootScheduler) takeNextJob() (queueJob, bool) {
+	q.lock.Lock()
+	defer q.lock.Unlock()
+	for i, job := range q.queue {
+		if q.active[job.queue] {
+			continue
+		}
+		// Remove element i in place and clear the vacated tail slot so the backing array does not keep the
+		// last job's closure alive.
+		last := len(q.queue) - 1
+		copy(q.queue[i:], q.queue[i+1:])
+		q.queue[last] = queueJob{}
+		q.queue = q.queue[:last]
+		q.active[job.queue] = true
+		// Wake another worker in case more jobs are runnable. This must not block: the lock is held here, and
+		// a full buffer already guarantees pending wake-ups.
+		select {
+		case q.workAvailable <- true:
+		default:
+		}
+		return job, true
+	}
+	return queueJob{}, false
+}