livepeer · rickstaa · Apr 16, 2024 · Apr 15, 2024 · Apr 16, 2024 · Apr 16, 2024
@@ -18,6 +18,7 @@ import (
 	"path/filepath"
 	"strconv"
 	"strings"
+	"sync"
 	"time"
 
 	ethcommon "github.com/ethereum/go-ethereum/common"
@@ -538,19 +539,27 @@ func StartLivepeer(ctx context.Context, cfg LivepeerConfig) {
 				return
 			}
 
+			var once sync.Once
 			for _, config := range configs {
 				modelConstraint := &core.ModelConstraint{Warm: config.Warm}
 
 				// If the config contains a URL we call Warm() anyway because AIWorker will just register
 				// the endpoint for an external container
 				if config.Warm || config.URL != "" {
 					endpoint := worker.RunnerEndpoint{URL: config.URL, Token: config.Token}
-					if err := n.AIWorker.Warm(ctx, config.Pipeline, config.ModelID, endpoint); err != nil {
+					if err := n.AIWorker.Warm(ctx, config.Pipeline, config.ModelID, endpoint, config.OptimizationFlags); err != nil {
 						glog.Errorf("Error AI worker warming %v container: %v", config.Pipeline, err)
 						return
 					}
 				}
 
+				// Show warning if people set OptimizationFlags but not Warm.
+				if len(config.OptimizationFlags) > 0 && !config.Warm {
+					once.Do(func() {
+						glog.Warningf("OptimizationFlags set for model %v but Warm is not set. OptimizationFlags are currently only used for warm containers.", config.ModelID)
+					})
+				}
+
 				switch config.Pipeline {
 				case "text-to-image":
 					_, ok := constraints[core.Capability_TextToImage]

@@ -15,18 +15,19 @@
 	TextToImage(context.Context, worker.TextToImageJSONRequestBody) (*worker.ImageResponse, error)
 	ImageToImage(context.Context, worker.ImageToImageMultipartRequestBody) (*worker.ImageResponse, error)
 	ImageToVideo(context.Context, worker.ImageToVideoMultipartRequestBody) (*worker.VideoResponse, error)
-	Warm(context.Context, string, string, worker.RunnerEndpoint) error
+	Warm(context.Context, string, string, worker.RunnerEndpoint, worker.OptimizationFlags) error
 	Stop(context.Context) error
 }
 
 type AIModelConfig struct {
-	Pipeline      string `json:"pipeline"`
-	ModelID       string `json:"model_id"`
-	URL           string `json:"url,omitempty"`
-	Token         string `json:"token,omitempty"`
-	Warm          bool   `json:"warm,omitempty"`
-	PricePerUnit  int64  `json:"price_per_unit,omitempty"`
-	PixelsPerUnit int64  `json:"pixels_per_unit,omitempty"`
+	Pipeline          string                   `json:"pipeline"`                     // pipeline name (e.g. "text-to-image"); switched on at startup to pick the capability
+	ModelID           string                   `json:"model_id"`                     // model identifier passed to AIWorker.Warm
+	URL               string                   `json:"url,omitempty"`                // external runner URL; when non-empty, Warm() is called even if Warm is false
+	Token             string                   `json:"token,omitempty"`              // paired with URL in the worker.RunnerEndpoint handed to AIWorker.Warm
+	Warm              bool                     `json:"warm,omitempty"`               // when true, the model is warmed via AIWorker.Warm at startup
+	PricePerUnit      int64                    `json:"price_per_unit,omitempty"`     // NOTE(review): presumably the price charged per unit; unit not visible here, confirm
+	PixelsPerUnit     int64                    `json:"pixels_per_unit,omitempty"`    // NOTE(review): presumably the number of pixels per pricing unit; confirm
+	OptimizationFlags worker.OptimizationFlags `json:"optimization_flags,omitempty"` // forwarded to AIWorker.Warm; currently only used for warm containers
 }
 
 func (config *AIModelConfig) UnmarshalJSON(data []byte) error {