|
| 1 | +package runner |
| 2 | + |
import (
	"context"
	"errors"
	"flag"
	"fmt"
	"net/http"

	"github.com/llm-d/llm-d-inference-scheduler/pkg/batch"
	"github.com/llm-d/llm-d-inference-scheduler/pkg/batch/redis"
	uberzap "go.uber.org/zap"
	"go.uber.org/zap/zapcore"
	ctrl "sigs.k8s.io/controller-runtime"
	"sigs.k8s.io/controller-runtime/pkg/log/zap"
	"sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/logging"
)
| 16 | + |
// Runner is the entry point of the batch processor; its Run method wires the
// components together and starts them. It currently holds no state.
type Runner struct{}
| 19 | + |
| 20 | +var ( |
| 21 | + setupLog = ctrl.Log.WithName("setup") |
| 22 | + logVerbosity = flag.Int("v", logging.DEFAULT, "number for the log level verbosity") |
| 23 | + concurrency = flag.Int("concurrency", 8, "number of concurrent workers") |
| 24 | + endpoint = flag.String("endpoint", "", "inference endpoint") |
| 25 | +) |
| 26 | + |
| 27 | +func NewRunner() *Runner { |
| 28 | + return &Runner{} |
| 29 | +} |
| 30 | + |
| 31 | +func (r *Runner) Run(ctx context.Context) error { |
| 32 | + opts := zap.Options{ |
| 33 | + Development: true, |
| 34 | + } |
| 35 | + opts.BindFlags(flag.CommandLine) |
| 36 | + flag.Parse() |
| 37 | + initLogging(&opts) |
| 38 | + |
| 39 | + /*if *tracing { |
| 40 | + err := common.InitTracing(ctx, setupLog) |
| 41 | + if err != nil { |
| 42 | + return err |
| 43 | + } |
| 44 | + }*/ |
| 45 | + |
| 46 | + ////////setupLog.Info("GIE build", "commit-sha", version.CommitSHA, "build-ref", version.BuildRef) |
| 47 | + |
| 48 | + // Validate flags |
| 49 | + if err := validateFlags(); err != nil { |
| 50 | + setupLog.Error(err, "Failed to validate flags") |
| 51 | + return err |
| 52 | + } |
| 53 | + |
| 54 | + // Print all flag values |
| 55 | + flags := make(map[string]any) |
| 56 | + flag.VisitAll(func(f *flag.Flag) { |
| 57 | + flags[f.Name] = f.Value |
| 58 | + }) |
| 59 | + setupLog.Info("Flags processed", "flags", flags) |
| 60 | + |
| 61 | + httpClient := &http.Client{ |
| 62 | + // TODO: configure |
| 63 | + } |
| 64 | + var policy batch.RequestPolicy = batch.NewRandomRobinPolicy() |
| 65 | + |
| 66 | + var impl batch.Flow = redis.NewRedisMQFlow("localhost:6379") |
| 67 | + requestChannel := policy.MergeRequestChannels(impl.RequestChannels()).Channel |
| 68 | + for w := 1; w <= *concurrency; w++ { |
| 69 | + go batch.Worker(ctx, *endpoint, httpClient, requestChannel, impl.RetryChannel(), impl.ResultChannel()) |
| 70 | + } |
| 71 | + |
| 72 | + impl.Start(ctx) |
| 73 | + |
| 74 | + return nil |
| 75 | +} |
| 76 | + |
| 77 | +// TODO: is this dup of |
| 78 | +func initLogging(opts *zap.Options) { |
| 79 | + // Unless -zap-log-level is explicitly set, use -v |
| 80 | + useV := true |
| 81 | + flag.Visit(func(f *flag.Flag) { |
| 82 | + if f.Name == "zap-log-level" { |
| 83 | + useV = false |
| 84 | + } |
| 85 | + }) |
| 86 | + if useV { |
| 87 | + // See https://pkg.go.dev/sigs.k8s.io/controller-runtime/pkg/log/zap#Options.Level |
| 88 | + lvl := -1 * (*logVerbosity) |
| 89 | + opts.Level = uberzap.NewAtomicLevelAt(zapcore.Level(int8(lvl))) |
| 90 | + } |
| 91 | + |
| 92 | + logger := zap.New(zap.UseFlagOptions(opts), zap.RawZapOpts(uberzap.AddCaller())) |
| 93 | + ctrl.SetLogger(logger) |
| 94 | +} |
| 95 | + |
| 96 | +func validateFlags() error { |
| 97 | + |
| 98 | + return nil |
| 99 | +} |
0 commit comments