agola/internal/services/scheduler/scheduler.go
Simone Gotti e46766829c runservice: rework store and readdb logic
* Remove all the small index files on the lts
* Keep on s3 only a full index of all runs containing the runid, grouppath and phase
  million of runs can take only some hundred of megabytes
* Periodically create a new dump of the index
2019-03-29 12:15:48 +01:00

132 lines
3.5 KiB
Go

// Copyright 2019 Sorint.lab
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied
// See the License for the specific language governing permissions and
// limitations under the License.
package scheduler
import (
"context"
"fmt"
"time"
slog "github.com/sorintlab/agola/internal/log"
"github.com/sorintlab/agola/internal/services/config"
rsapi "github.com/sorintlab/agola/internal/services/runservice/scheduler/api"
"github.com/pkg/errors"
"go.uber.org/zap"
"go.uber.org/zap/zapcore"
)
var level = zap.NewAtomicLevelAt(zapcore.InfoLevel)
var logger = slog.New(level)
var log = logger.Sugar()
func (s *Scheduler) scheduleLoop(ctx context.Context) {
for {
if err := s.schedule(ctx); err != nil {
log.Errorf("err: %+v", err)
}
time.Sleep(1 * time.Second)
}
}
func (s *Scheduler) schedule(ctx context.Context) error {
// create a list of project and users with queued runs
groups := map[string]struct{}{}
var lastRunID string
for {
queuedRunsResponse, _, err := s.runserviceClient.GetQueuedRuns(ctx, lastRunID, 0)
if err != nil {
return errors.Wrapf(err, "failed to get queued runs")
}
//log.Infof("queuedRuns: %s", util.Dump(queuedRunsResponse.Runs))
for _, run := range queuedRunsResponse.Runs {
groups[run.Group] = struct{}{}
}
if len(queuedRunsResponse.Runs) == 0 {
break
}
if len(queuedRunsResponse.Runs) > 0 {
lastRunID = queuedRunsResponse.Runs[len(queuedRunsResponse.Runs)-1].ID
}
}
for groupID := range groups {
if err := s.scheduleRun(ctx, groupID); err != nil {
log.Errorf("scheduler err: %v", err)
}
}
return nil
}
func (s *Scheduler) scheduleRun(ctx context.Context, groupID string) error {
// get first queued run
queuedRunsResponse, _, err := s.runserviceClient.GetGroupFirstQueuedRuns(ctx, groupID, nil)
//log.Infof("first queuedRuns: %s", util.Dump(queuedRunsResponse.Runs))
if err != nil {
return errors.Wrapf(err, "failed to get the first project queued run")
}
if len(queuedRunsResponse.Runs) == 0 {
return nil
}
//log.Infof("queued runs: %s", queuedRunsResponse.Runs)
run := queuedRunsResponse.Runs[0]
runningRunsResponse, _, err := s.runserviceClient.GetGroupRunningRuns(ctx, groupID, 1, []string{fmt.Sprintf("changegroup-%s", groupID)})
if err != nil {
return errors.Wrapf(err, "failed to get running runs")
}
//log.Infof("running Runs: %s", util.Dump(runningRunsResponse.Runs))
if len(runningRunsResponse.Runs) == 0 {
log.Infof("starting run %s", run.ID)
log.Infof("changegroups: %s", runningRunsResponse.ChangeGroupsUpdateToken)
if _, err := s.runserviceClient.StartRun(ctx, run.ID, runningRunsResponse.ChangeGroupsUpdateToken); err != nil {
log.Errorf("failed to start run %s: %v", run.ID, err)
}
}
return nil
}
type Scheduler struct {
c *config.Scheduler
runserviceClient *rsapi.Client
}
func NewScheduler(c *config.Scheduler) (*Scheduler, error) {
if c.Debug {
level.SetLevel(zapcore.DebugLevel)
}
return &Scheduler{
runserviceClient: rsapi.NewClient(c.RunServiceURL),
}, nil
}
func (s *Scheduler) Run(ctx context.Context) error {
go s.scheduleLoop(ctx)
select {
case <-ctx.Done():
log.Infof("scheduler exiting")
return nil
}
}