refactor: migrate the job gc to mananger gc server (#3991)
refactor: migrate the job gc to manager gc server. Signed-off-by: chlins <chlins.zhang@gmail.com>
This commit is contained in:
parent
876fd78080
commit
36c110b358
|
|
@ -0,0 +1,110 @@
|
||||||
|
/*
|
||||||
|
* Copyright 2025 The Dragonfly Authors
|
||||||
|
*
|
||||||
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
* you may not use this file except in compliance with the License.
|
||||||
|
* You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package gc
|
||||||
|
|
||||||
|
import (
|
||||||
|
"encoding/json"
|
||||||
|
"time"
|
||||||
|
|
||||||
|
"gorm.io/gorm"
|
||||||
|
|
||||||
|
logger "d7y.io/dragonfly/v2/internal/dflog"
|
||||||
|
"d7y.io/dragonfly/v2/manager/models"
|
||||||
|
libgc "d7y.io/dragonfly/v2/pkg/gc"
|
||||||
|
)
|
||||||
|
|
||||||
|
const (
|
||||||
|
// DefaultJobGCBatchSize is the default batch size for deleting jobs.
|
||||||
|
DefaultJobGCBatchSize = 5000
|
||||||
|
|
||||||
|
// DefaultJobGCInterval is the default interval for running job GC.
|
||||||
|
DefaultJobGCInterval = time.Hour * 3
|
||||||
|
|
||||||
|
// DefaultJobGCTimeout is the default timeout for running job GC.
|
||||||
|
DefaultJobGCTimeout = time.Hour * 1
|
||||||
|
|
||||||
|
// JohGCTaskID is the ID of the job GC task.
|
||||||
|
JobGCTaskID = "job"
|
||||||
|
)
|
||||||
|
|
||||||
|
func NewJobGCTask(db *gorm.DB) libgc.Task {
|
||||||
|
return libgc.Task{
|
||||||
|
ID: JobGCTaskID,
|
||||||
|
Interval: DefaultJobGCInterval,
|
||||||
|
Timeout: DefaultJobGCTimeout,
|
||||||
|
Runner: &job{db: db, recorder: newJobRecorder(db)},
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// job is the struct for cleaning up jobs which implements the gc Runner interface.
|
||||||
|
type job struct {
|
||||||
|
db *gorm.DB
|
||||||
|
recorder *jobRecorder
|
||||||
|
}
|
||||||
|
|
||||||
|
// RunGC implements the gc Runner interface.
|
||||||
|
func (j *job) RunGC() error {
|
||||||
|
ttl, err := j.getTTL()
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
if err = j.recorder.Init(JobGCTaskID, models.JSONMap{
|
||||||
|
"ttl": ttl,
|
||||||
|
"batch_size": DefaultJobGCBatchSize,
|
||||||
|
}); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
var gcResult Result
|
||||||
|
defer func() {
|
||||||
|
if err := j.recorder.Record(gcResult); err != nil {
|
||||||
|
logger.Errorf("failed to record job GC result: %v", err)
|
||||||
|
}
|
||||||
|
}()
|
||||||
|
|
||||||
|
for {
|
||||||
|
result := j.db.Where("created_at < ?", time.Now().Add(-ttl)).Limit(DefaultJobGCBatchSize).Unscoped().Delete(&models.Job{})
|
||||||
|
if result.Error != nil {
|
||||||
|
gcResult.Error = result.Error
|
||||||
|
return result.Error
|
||||||
|
}
|
||||||
|
|
||||||
|
if result.RowsAffected == 0 {
|
||||||
|
break
|
||||||
|
}
|
||||||
|
|
||||||
|
gcResult.Purged += result.RowsAffected
|
||||||
|
logger.Infof("gc job deleted %d jobs", result.RowsAffected)
|
||||||
|
}
|
||||||
|
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (j *job) getTTL() (time.Duration, error) {
|
||||||
|
var config models.Config
|
||||||
|
if err := j.db.Model(models.Config{}).First(&config, &models.Config{Name: models.ConfigGC}).Error; err != nil {
|
||||||
|
return 0, err
|
||||||
|
}
|
||||||
|
|
||||||
|
var gcConfig models.GCConfig
|
||||||
|
if err := json.Unmarshal([]byte(config.Value), &gcConfig); err != nil {
|
||||||
|
return 0, err
|
||||||
|
}
|
||||||
|
|
||||||
|
return gcConfig.Job.TTL, nil
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,87 @@
|
||||||
|
/*
|
||||||
|
* Copyright 2025 The Dragonfly Authors
|
||||||
|
*
|
||||||
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
* you may not use this file except in compliance with the License.
|
||||||
|
* You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package gc
|
||||||
|
|
||||||
|
import (
|
||||||
|
"errors"
|
||||||
|
|
||||||
|
"gorm.io/gorm"
|
||||||
|
|
||||||
|
"d7y.io/dragonfly/v2/manager/models"
|
||||||
|
)
|
||||||
|
|
||||||
|
const (
|
||||||
|
// GCJobType indicates the gc task is completed successfully.
|
||||||
|
GCJobType = "gc"
|
||||||
|
|
||||||
|
// GCStateSuccess indicates the gc task is completed successfully.
|
||||||
|
GCStateSuccess = "SUCCESS"
|
||||||
|
|
||||||
|
// GCStateFailure indicates the gc task is completed with failure.
|
||||||
|
GCStateFailure = "FAILURE"
|
||||||
|
)
|
||||||
|
|
||||||
|
type Result struct {
|
||||||
|
Error error
|
||||||
|
Purged int64
|
||||||
|
}
|
||||||
|
|
||||||
|
type jobRecorder struct {
|
||||||
|
db *gorm.DB
|
||||||
|
job *models.Job
|
||||||
|
}
|
||||||
|
|
||||||
|
func newJobRecorder(db *gorm.DB) *jobRecorder {
|
||||||
|
return &jobRecorder{
|
||||||
|
db: db,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func (jb *jobRecorder) Init(taskID string, args models.JSONMap) error {
|
||||||
|
job := models.Job{
|
||||||
|
Type: GCJobType,
|
||||||
|
TaskID: taskID,
|
||||||
|
Args: args,
|
||||||
|
}
|
||||||
|
|
||||||
|
if err := jb.db.Create(&job).Error; err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
jb.job = &job
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (jb *jobRecorder) Record(result Result) error {
|
||||||
|
if jb.job == nil {
|
||||||
|
return errors.New("job not found")
|
||||||
|
}
|
||||||
|
|
||||||
|
if jb.job.Result == nil {
|
||||||
|
jb.job.Result = make(models.JSONMap)
|
||||||
|
}
|
||||||
|
|
||||||
|
jb.job.State = GCStateSuccess
|
||||||
|
jb.job.Result["purged"] = result.Purged
|
||||||
|
|
||||||
|
if result.Error != nil {
|
||||||
|
jb.job.State = GCStateFailure
|
||||||
|
jb.job.Result["error"] = result.Error.Error()
|
||||||
|
}
|
||||||
|
|
||||||
|
return jb.db.Save(jb.job).Error
|
||||||
|
}
|
||||||
|
|
@ -1,94 +0,0 @@
|
||||||
/*
|
|
||||||
* Copyright 2024 The Dragonfly Authors
|
|
||||||
*
|
|
||||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
||||||
* you may not use this file except in compliance with the License.
|
|
||||||
* You may obtain a copy of the License at
|
|
||||||
*
|
|
||||||
* http://www.apache.org/licenses/LICENSE-2.0
|
|
||||||
*
|
|
||||||
* Unless required by applicable law or agreed to in writing, software
|
|
||||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
||||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
||||||
* See the License for the specific language governing permissions and
|
|
||||||
* limitations under the License.
|
|
||||||
*/
|
|
||||||
|
|
||||||
//go:generate mockgen -destination mocks/gc_mock.go -source gc.go -package mocks
|
|
||||||
|
|
||||||
package job
|
|
||||||
|
|
||||||
import (
|
|
||||||
"context"
|
|
||||||
"time"
|
|
||||||
|
|
||||||
"gorm.io/gorm"
|
|
||||||
|
|
||||||
logger "d7y.io/dragonfly/v2/internal/dflog"
|
|
||||||
"d7y.io/dragonfly/v2/manager/config"
|
|
||||||
"d7y.io/dragonfly/v2/manager/models"
|
|
||||||
)
|
|
||||||
|
|
||||||
// GC is an interface for gc.
|
|
||||||
type GC interface {
|
|
||||||
// Serve started gc server.
|
|
||||||
Serve()
|
|
||||||
|
|
||||||
// Stop gc server.
|
|
||||||
Stop()
|
|
||||||
}
|
|
||||||
|
|
||||||
// gc is an implementation of GC.
|
|
||||||
type gc struct {
|
|
||||||
config *config.Config
|
|
||||||
db *gorm.DB
|
|
||||||
done chan struct{}
|
|
||||||
}
|
|
||||||
|
|
||||||
// newGC returns a new GC.
|
|
||||||
func newGC(cfg *config.Config, gdb *gorm.DB) (GC, error) {
|
|
||||||
return &gc{
|
|
||||||
config: cfg,
|
|
||||||
db: gdb,
|
|
||||||
done: make(chan struct{}),
|
|
||||||
}, nil
|
|
||||||
}
|
|
||||||
|
|
||||||
// Serve started gc server.
|
|
||||||
func (gc *gc) Serve() {
|
|
||||||
tick := time.NewTicker(gc.config.Job.GC.Interval)
|
|
||||||
for {
|
|
||||||
select {
|
|
||||||
case <-tick.C:
|
|
||||||
logger.Infof("gc job started")
|
|
||||||
if err := gc.deleteInBatches(context.Background()); err != nil {
|
|
||||||
logger.Errorf("gc job failed: %v", err)
|
|
||||||
}
|
|
||||||
case <-gc.done:
|
|
||||||
return
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Stop gc server.
|
|
||||||
func (gc *gc) Stop() {
|
|
||||||
close(gc.done)
|
|
||||||
}
|
|
||||||
|
|
||||||
// deleteInBatches deletes jobs in batches.
|
|
||||||
func (gc *gc) deleteInBatches(ctx context.Context) error {
|
|
||||||
for {
|
|
||||||
result := gc.db.WithContext(ctx).Where("created_at < ?", time.Now().Add(-gc.config.Job.GC.TTL)).Limit(gc.config.Job.GC.BatchSize).Unscoped().Delete(&models.Job{})
|
|
||||||
if result.Error != nil {
|
|
||||||
return result.Error
|
|
||||||
}
|
|
||||||
|
|
||||||
if result.RowsAffected == 0 {
|
|
||||||
break
|
|
||||||
}
|
|
||||||
|
|
||||||
logger.Infof("gc job deleted %d jobs", result.RowsAffected)
|
|
||||||
}
|
|
||||||
|
|
||||||
return nil
|
|
||||||
}
|
|
||||||
|
|
@ -41,7 +41,6 @@ type Job struct {
|
||||||
Preheat
|
Preheat
|
||||||
SyncPeers
|
SyncPeers
|
||||||
Task
|
Task
|
||||||
GC
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// New returns a new Job.
|
// New returns a new Job.
|
||||||
|
|
@ -78,29 +77,21 @@ func New(cfg *config.Config, gdb *gorm.DB) (*Job, error) {
|
||||||
return nil, err
|
return nil, err
|
||||||
}
|
}
|
||||||
|
|
||||||
gc, err := newGC(cfg, gdb)
|
|
||||||
if err != nil {
|
|
||||||
return nil, err
|
|
||||||
}
|
|
||||||
|
|
||||||
return &Job{
|
return &Job{
|
||||||
Job: j,
|
Job: j,
|
||||||
Preheat: preheat,
|
Preheat: preheat,
|
||||||
SyncPeers: syncPeers,
|
SyncPeers: syncPeers,
|
||||||
Task: newTask(j),
|
Task: newTask(j),
|
||||||
GC: gc,
|
|
||||||
}, nil
|
}, nil
|
||||||
}
|
}
|
||||||
|
|
||||||
// Serve starts the job server.
|
// Serve starts the job server.
|
||||||
func (j *Job) Serve() {
|
func (j *Job) Serve() {
|
||||||
go j.GC.Serve()
|
|
||||||
go j.SyncPeers.Serve()
|
go j.SyncPeers.Serve()
|
||||||
}
|
}
|
||||||
|
|
||||||
// Stop stops the job server.
|
// Stop stops the job server.
|
||||||
func (j *Job) Stop() {
|
func (j *Job) Stop() {
|
||||||
j.GC.Stop()
|
|
||||||
j.SyncPeers.Stop()
|
j.SyncPeers.Stop()
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -34,6 +34,7 @@ import (
|
||||||
"d7y.io/dragonfly/v2/manager/cache"
|
"d7y.io/dragonfly/v2/manager/cache"
|
||||||
"d7y.io/dragonfly/v2/manager/config"
|
"d7y.io/dragonfly/v2/manager/config"
|
||||||
"d7y.io/dragonfly/v2/manager/database"
|
"d7y.io/dragonfly/v2/manager/database"
|
||||||
|
"d7y.io/dragonfly/v2/manager/gc"
|
||||||
"d7y.io/dragonfly/v2/manager/job"
|
"d7y.io/dragonfly/v2/manager/job"
|
||||||
"d7y.io/dragonfly/v2/manager/metrics"
|
"d7y.io/dragonfly/v2/manager/metrics"
|
||||||
"d7y.io/dragonfly/v2/manager/permission/rbac"
|
"d7y.io/dragonfly/v2/manager/permission/rbac"
|
||||||
|
|
@ -42,6 +43,7 @@ import (
|
||||||
"d7y.io/dragonfly/v2/manager/searcher"
|
"d7y.io/dragonfly/v2/manager/searcher"
|
||||||
"d7y.io/dragonfly/v2/manager/service"
|
"d7y.io/dragonfly/v2/manager/service"
|
||||||
"d7y.io/dragonfly/v2/pkg/dfpath"
|
"d7y.io/dragonfly/v2/pkg/dfpath"
|
||||||
|
pkggc "d7y.io/dragonfly/v2/pkg/gc"
|
||||||
"d7y.io/dragonfly/v2/pkg/net/ip"
|
"d7y.io/dragonfly/v2/pkg/net/ip"
|
||||||
"d7y.io/dragonfly/v2/pkg/objectstorage"
|
"d7y.io/dragonfly/v2/pkg/objectstorage"
|
||||||
"d7y.io/dragonfly/v2/pkg/rpc"
|
"d7y.io/dragonfly/v2/pkg/rpc"
|
||||||
|
|
@ -93,6 +95,9 @@ type Server struct {
|
||||||
// Job rate limiter.
|
// Job rate limiter.
|
||||||
jobRateLimiter ratelimiter.JobRateLimiter
|
jobRateLimiter ratelimiter.JobRateLimiter
|
||||||
|
|
||||||
|
// GC server.
|
||||||
|
gc pkggc.GC
|
||||||
|
|
||||||
// GRPC server.
|
// GRPC server.
|
||||||
grpcServer *grpc.Server
|
grpcServer *grpc.Server
|
||||||
|
|
||||||
|
|
@ -157,6 +162,14 @@ func New(cfg *config.Config, d dfpath.Dfpath) (*Server, error) {
|
||||||
return nil, err
|
return nil, err
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Initialize garbage collector.
|
||||||
|
s.gc = pkggc.New()
|
||||||
|
|
||||||
|
// Register job gc task.
|
||||||
|
if err := s.gc.Add(gc.NewJobGCTask(db.DB)); err != nil {
|
||||||
|
return nil, err
|
||||||
|
}
|
||||||
|
|
||||||
// Initialize REST server.
|
// Initialize REST server.
|
||||||
restService := service.New(cfg, db, cache, job, enforcer, objectStorage)
|
restService := service.New(cfg, db, cache, job, enforcer, objectStorage)
|
||||||
router, err := router.Init(cfg, d.LogDir(), restService, db, enforcer, s.jobRateLimiter, EmbedFolder(assets, assetsTargetPath))
|
router, err := router.Init(cfg, d.LogDir(), restService, db, enforcer, s.jobRateLimiter, EmbedFolder(assets, assetsTargetPath))
|
||||||
|
|
@ -253,6 +266,10 @@ func (s *Server) Serve() error {
|
||||||
s.jobRateLimiter.Serve()
|
s.jobRateLimiter.Serve()
|
||||||
}()
|
}()
|
||||||
|
|
||||||
|
// Started gc server.
|
||||||
|
s.gc.Start()
|
||||||
|
logger.Info("started gc server")
|
||||||
|
|
||||||
// Generate GRPC listener.
|
// Generate GRPC listener.
|
||||||
ip, ok := ip.FormatIP(s.config.Server.GRPC.ListenIP.String())
|
ip, ok := ip.FormatIP(s.config.Server.GRPC.ListenIP.String())
|
||||||
if !ok {
|
if !ok {
|
||||||
|
|
@ -299,6 +316,9 @@ func (s *Server) Stop() {
|
||||||
// Stop job rate limiter.
|
// Stop job rate limiter.
|
||||||
s.jobRateLimiter.Stop()
|
s.jobRateLimiter.Stop()
|
||||||
|
|
||||||
|
// Stop gc server.
|
||||||
|
s.gc.Stop()
|
||||||
|
|
||||||
// Stop GRPC server.
|
// Stop GRPC server.
|
||||||
stopped := make(chan struct{})
|
stopped := make(chan struct{})
|
||||||
go func() {
|
go func() {
|
||||||
|
|
|
||||||
|
|
@ -28,12 +28,14 @@ import (
|
||||||
)
|
)
|
||||||
|
|
||||||
const (
|
const (
|
||||||
// auditBatchInsertSize is the size for batch insertion.
|
// AuditBufferSize is the size of the audit channel buffer.
|
||||||
auditBatchInsertSize = 500
|
AuditBufferSize = 1000
|
||||||
// auditBatchInsertInterval is the interval for batch insertion.
|
|
||||||
auditBatchInsertInterval = 5 * time.Second
|
// AuditInsertBatchSize is the size for batch insertion.
|
||||||
// auditBufferSize is the size of the audit channel buffer.
|
AuditInsertBatchSize = 500
|
||||||
auditBufferSize = 1000
|
|
||||||
|
// AuditInsertInterval is the interval for batch insertion.
|
||||||
|
AuditInsertInterval = time.Second * 5
|
||||||
)
|
)
|
||||||
|
|
||||||
var (
|
var (
|
||||||
|
|
@ -43,7 +45,7 @@ var (
|
||||||
|
|
||||||
func (s *service) AsyncCreateAudit(ctx context.Context, json *types.CreateAuditRequest) error {
|
func (s *service) AsyncCreateAudit(ctx context.Context, json *types.CreateAuditRequest) error {
|
||||||
once.Do(func() {
|
once.Do(func() {
|
||||||
auditCh = make(chan *models.Audit, auditBufferSize)
|
auditCh = make(chan *models.Audit, AuditBufferSize)
|
||||||
go s.processAudit()
|
go s.processAudit()
|
||||||
})
|
})
|
||||||
|
|
||||||
|
|
@ -67,7 +69,7 @@ func (s *service) AsyncCreateAudit(ctx context.Context, json *types.CreateAuditR
|
||||||
return nil
|
return nil
|
||||||
default:
|
default:
|
||||||
// Avoid to hang out the AsyncCreateAudit if the buffer is full.
|
// Avoid to hang out the AsyncCreateAudit if the buffer is full.
|
||||||
return fmt.Errorf("audit buffer is full, buffer size: %d, drop the audit %#v", auditBufferSize, audit)
|
return fmt.Errorf("audit buffer is full, buffer size: %d, drop the audit %#v", AuditBufferSize, audit)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
@ -75,8 +77,8 @@ func (s *service) AsyncCreateAudit(ctx context.Context, json *types.CreateAuditR
|
||||||
func (s *service) processAudit() {
|
func (s *service) processAudit() {
|
||||||
// Use the new context as this is asynchronous operation.
|
// Use the new context as this is asynchronous operation.
|
||||||
ctx := context.Background()
|
ctx := context.Background()
|
||||||
audits := make([]*models.Audit, 0, auditBatchInsertSize)
|
audits := make([]*models.Audit, 0, AuditInsertBatchSize)
|
||||||
ticker := time.NewTicker(auditBatchInsertInterval)
|
ticker := time.NewTicker(AuditInsertInterval)
|
||||||
defer ticker.Stop()
|
defer ticker.Stop()
|
||||||
|
|
||||||
createAuditInBatch := func(ctx context.Context, audits []*models.Audit) error {
|
createAuditInBatch := func(ctx context.Context, audits []*models.Audit) error {
|
||||||
|
|
@ -101,17 +103,17 @@ func (s *service) processAudit() {
|
||||||
}
|
}
|
||||||
|
|
||||||
audits = append(audits, audit)
|
audits = append(audits, audit)
|
||||||
if len(audits) >= auditBatchInsertSize {
|
if len(audits) >= AuditInsertBatchSize {
|
||||||
if err := createAuditInBatch(ctx, audits); err == nil {
|
if err := createAuditInBatch(ctx, audits); err == nil {
|
||||||
audits = make([]*models.Audit, 0, auditBatchInsertSize)
|
audits = make([]*models.Audit, 0, AuditInsertBatchSize)
|
||||||
}
|
}
|
||||||
|
|
||||||
ticker.Reset(auditBatchInsertInterval)
|
ticker.Reset(AuditInsertInterval)
|
||||||
}
|
}
|
||||||
case <-ticker.C:
|
case <-ticker.C:
|
||||||
if len(audits) > 0 {
|
if len(audits) > 0 {
|
||||||
if err := createAuditInBatch(ctx, audits); err == nil {
|
if err := createAuditInBatch(ctx, audits); err == nil {
|
||||||
audits = make([]*models.Audit, 0, auditBatchInsertSize)
|
audits = make([]*models.Audit, 0, AuditInsertBatchSize)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue