docker
diff --git a/cmd/cli/commands/compose.go b/cmd/cli/commands/compose.go
Lines changed: 12 additions & 6 deletions
diff --git a/cmd/cli/commands/configure.go b/cmd/cli/commands/configure.go
Lines changed: 8 additions & 2 deletions
diff --git a/cmd/cli/commands/package.go b/cmd/cli/commands/package.go
Lines changed: 2 additions & 2 deletions
diff --git a/cmd/mdltool/main.go b/cmd/mdltool/main.go
Lines changed: 1 addition & 1 deletion
diff --git a/pkg/distribution/builder/builder.go b/pkg/distribution/builder/builder.go
Lines changed: 1 addition & 1 deletion
diff --git a/pkg/distribution/internal/mutate/model.go b/pkg/distribution/internal/mutate/model.go
Lines changed: 1 addition & 1 deletion
diff --git a/pkg/distribution/internal/mutate/mutate.go b/pkg/distribution/internal/mutate/mutate.go
Lines changed: 1 addition & 1 deletion
diff --git a/pkg/distribution/internal/mutate/mutate_test.go b/pkg/distribution/internal/mutate/mutate_test.go
Lines changed: 1 addition & 1 deletion
diff --git a/pkg/distribution/internal/store/store_test.go b/pkg/distribution/internal/store/store_test.go
Lines changed: 4 additions & 4 deletions
diff --git a/pkg/distribution/types/config.go b/pkg/distribution/types/config.go
Lines changed: 1 addition & 1 deletion
@@ -66,7 +66,7 @@ func newUpCommand() *cobra.Command {
 				return err
 			}
 
-			if ctxSize > 0 {
+			if cmd.Flags().Changed("context-size") {
 				sendInfo(fmt.Sprintf("Setting context size to %d", ctxSize))
 			}
 
@@ -82,12 +82,18 @@ func newUpCommand() *cobra.Command {
 			}
 
 			for _, model := range models {
+				configuration := inference.BackendConfiguration{
+					Speculative: speculativeConfig,
+				}
+				if cmd.Flags().Changed("context-size") {
+					//TODO is the context size the same for all models?
+					v := int32(ctxSize)
+					configuration.ContextSize = &v
+				}
+
 				if err := desktopClient.ConfigureBackend(scheduling.ConfigureRequest{
-					Model: model,
-					BackendConfiguration: inference.BackendConfiguration{
-						ContextSize: ctxSize,
-						Speculative: speculativeConfig,
-					},
+					Model:                model,
+					BackendConfiguration: configuration,
 				}); err != nil {
 					configErrFmtString := "failed to configure backend for model %s with context-size %d"
 					_ = sendErrorf(configErrFmtString+": %v", model, ctxSize, err)
 
@@ -17,6 +17,7 @@ func newConfigureCmd() *cobra.Command {
 	var numTokens int
 	var minAcceptanceRate float64
 	var hfOverrides string
+	var contextSize int64
 	var reasoningBudget int64
 
 	c := &cobra.Command{
@@ -34,6 +35,10 @@ func newConfigureCmd() *cobra.Command {
 			return nil
 		},
 		RunE: func(cmd *cobra.Command, args []string) error {
+			if cmd.Flags().Changed("context-size") {
+				v := int32(contextSize)
+				opts.ContextSize = &v
+			}
 			// Build the speculative config if any speculative flags are set
 			if draftModel != "" || numTokens > 0 || minAcceptanceRate > 0 {
 				opts.Speculative = &inference.SpeculativeDecodingConfig{
@@ -64,14 +69,15 @@ func newConfigureCmd() *cobra.Command {
 				if opts.LlamaCpp == nil {
 					opts.LlamaCpp = &inference.LlamaCppConfig{}
 				}
-				opts.LlamaCpp.ReasoningBudget = &reasoningBudget
+				v := int32(reasoningBudget)
+				opts.LlamaCpp.ReasoningBudget = &v
 			}
 			return desktopClient.ConfigureBackend(opts)
 		},
 		ValidArgsFunction: completion.ModelNames(getDesktopClient, -1),
 	}
 
-	c.Flags().Int64Var(&opts.ContextSize, "context-size", -1, "context size (in tokens)")
+	c.Flags().Int64Var(&contextSize, "context-size", 0, "context size (in tokens)")
 	c.Flags().StringVar(&draftModel, "speculative-draft-model", "", "draft model for speculative decoding")
 	c.Flags().IntVar(&numTokens, "speculative-num-tokens", 0, "number of tokens to predict speculatively")
 	c.Flags().Float64Var(&minAcceptanceRate, "speculative-min-acceptance-rate", 0, "minimum acceptance rate for speculative decoding")
 
@@ -284,9 +284,9 @@ func packageModel(cmd *cobra.Command, opts packageOptions) error {
 	distClient := initResult.distClient
 
 	// Set context size
-	if opts.contextSize > 0 {
+	if cmd.Flags().Changed("context-size") {
 		cmd.PrintErrf("Setting context size %d\n", opts.contextSize)
-		pkg = pkg.WithContextSize(opts.contextSize)
+		pkg = pkg.WithContextSize(int32(opts.contextSize))
 	}
 
 	// Add license files
 
@@ -321,7 +321,7 @@ func cmdPackage(args []string) int {
 
 	if contextSize > 0 {
 		fmt.Println("Setting context size:", contextSize)
-		b = b.WithContextSize(contextSize)
+		b = b.WithContextSize(int32(contextSize))
 	}
 
 	if mmproj != "" {
 
@@ -67,7 +67,7 @@ func (b *Builder) WithLicense(path string) (*Builder, error) {
 	}, nil
 }
 
-func (b *Builder) WithContextSize(size uint64) *Builder {
+func (b *Builder) WithContextSize(size int32) *Builder {
 	return &Builder{
 		model:          mutate.ContextSize(b.model, size),
 		originalLayers: b.originalLayers,
 
@@ -16,7 +16,7 @@ type model struct {
 	base            types.ModelArtifact
 	appended        []v1.Layer
 	configMediaType ggcr.MediaType
-	contextSize     *uint64
+	contextSize     *int32
 }
 
 func (m *model) Descriptor() (types.Descriptor, error) {
 
@@ -21,7 +21,7 @@ func ConfigMediaType(mdl types.ModelArtifact, mt ggcr.MediaType) types.ModelArti
 	}
 }
 
-func ContextSize(mdl types.ModelArtifact, cs uint64) types.ModelArtifact {
+func ContextSize(mdl types.ModelArtifact, cs int32) types.ModelArtifact {
 	return &model{
 		base:        mdl,
 		contextSize: &cs,
 
@@ -108,7 +108,7 @@ func TestContextSize(t *testing.T) {
 	if cfg2.ContextSize == nil {
 		t.Fatal("Expected non-nil context")
 	}
-	if *cfg2.ContextSize != uint64(2096) {
+	if *cfg2.ContextSize != 2096 {
 		t.Fatalf("Expected context size of 2096 got %d", *cfg2.ContextSize)
 	}
 }
@@ -1040,7 +1040,7 @@ func TestWriteLightweight(t *testing.T) {
 		}
 
 		// Modify the model's config by changing context size
-		newContextSize := uint64(4096)
+		newContextSize := int32(4096)
 		modifiedModel := mutate.ContextSize(baseModel, newContextSize)
 
 		// Use WriteLightweight to write the modified model
@@ -1135,7 +1135,7 @@ func TestWriteLightweight(t *testing.T) {
 		}
 
 		// Create a variant with different config
-		newContextSize := uint64(8192)
+		newContextSize := int32(8192)
 		variant := mutate.ContextSize(baseModel, newContextSize)
 
 		// Use WriteLightweight with multiple tags
@@ -1213,7 +1213,7 @@ func TestWriteLightweight(t *testing.T) {
 		}
 
 		// Create a variant with different context size
-		newContextSize := uint64(2048)
+		newContextSize := int32(2048)
 		variant := mutate.ContextSize(baseModel, newContextSize)
 
 		// Use WriteLightweight for the variant
@@ -1271,7 +1271,7 @@ func TestWriteLightweight(t *testing.T) {
 
 		// Create multiple variants using WriteLightweight
 		for i := 1; i <= 3; i++ {
-			contextSize := uint64(1024 * i)
+			contextSize := int32(1024 * i)
 			variant := mutate.ContextSize(baseModel, contextSize)
 			tag := fmt.Sprintf("integrity-test:variant%d", i)
 			if err := s.WriteLightweight(variant, []string{tag}); err != nil {
 
@@ -67,7 +67,7 @@ type Config struct {
 	Size         string            `json:"size,omitempty"`
 	GGUF         map[string]string `json:"gguf,omitempty"`
 	Safetensors  map[string]string `json:"safetensors,omitempty"`
-	ContextSize  *uint64           `json:"context_size,omitempty"`
+	ContextSize  *int32            `json:"context_size,omitempty"`
 }
 
 // Descriptor provides metadata about the provenance of the model.
Original file line number	Diff line number	Diff line change
`@@ -321,7 +321,7 @@ func cmdPackage(args []string) int {`
`321`	`321`
`322`	`322`	`if contextSize > 0 {`
`323`	`323`	`fmt.Println("Setting context size:", contextSize)`
`324`		`- b = b.WithContextSize(contextSize)`
	`324`	`+ b = b.WithContextSize(int32(contextSize))`
`325`	`325`	`}`
`326`	`326`
`327`	`327`	`if mmproj != "" {`
Original file line number	Diff line number	Diff line change
`@@ -67,7 +67,7 @@ func (b *Builder) WithLicense(path string) (*Builder, error) {`
`67`	`67`	`}, nil`
`68`	`68`	`}`
`69`	`69`
`70`		`-func (b *Builder) WithContextSize(size uint64) *Builder {`
	`70`	`+func (b *Builder) WithContextSize(size int32) *Builder {`
`71`	`71`	`return &Builder{`
`72`	`72`	`model: mutate.ContextSize(b.model, size),`
`73`	`73`	`originalLayers: b.originalLayers,`
Original file line number	Diff line number	Diff line change
`@@ -16,7 +16,7 @@ type model struct {`
`16`	`16`	`base types.ModelArtifact`
`17`	`17`	`appended []v1.Layer`
`18`	`18`	`configMediaType ggcr.MediaType`
`19`		`- contextSize *uint64`
	`19`	`+ contextSize *int32`
`20`	`20`	`}`
`21`	`21`
`22`	`22`	`func (m *model) Descriptor() (types.Descriptor, error) {`
Original file line number	Diff line number	Diff line change
`@@ -21,7 +21,7 @@ func ConfigMediaType(mdl types.ModelArtifact, mt ggcr.MediaType) types.ModelArti`
`21`	`21`	`}`
`22`	`22`	`}`
`23`	`23`
`24`		`-func ContextSize(mdl types.ModelArtifact, cs uint64) types.ModelArtifact {`
	`24`	`+func ContextSize(mdl types.ModelArtifact, cs int32) types.ModelArtifact {`
`25`	`25`	`return &model{`
`26`	`26`	`base: mdl,`
`27`	`27`	`contextSize: &cs,`
Original file line number	Diff line number	Diff line change
`@@ -108,7 +108,7 @@ func TestContextSize(t *testing.T) {`
`108`	`108`	`if cfg2.ContextSize == nil {`
`109`	`109`	`t.Fatal("Expected non-nil context")`
`110`	`110`	`}`
`111`		`- if *cfg2.ContextSize != uint64(2096) {`
	`111`	`+ if *cfg2.ContextSize != 2096 {`
`112`	`112`	`t.Fatalf("Expected context size of 2096 got %d", *cfg2.ContextSize)`
`113`	`113`	`}`
`114`	`114`	`}`
Original file line number	Diff line number	Diff line change
`@@ -67,7 +67,7 @@ type Config struct {`
`67`	`67`	Size string `json:"size,omitempty"`
`68`	`68`	GGUF map[string]string `json:"gguf,omitempty"`
`69`	`69`	Safetensors map[string]string `json:"safetensors,omitempty"`
`70`		- ContextSize *uint64 `json:"context_size,omitempty"`
	`70`	+ ContextSize *int32 `json:"context_size,omitempty"`
`71`	`71`	`}`
`72`	`72`
`73`	`73`	`// Descriptor provides metadata about the provenance of the model.`