@@ -71,12 +71,6 @@ public class OllamaOptions implements FunctionCallingOptions, ChatOptions, Embed
71
71
*/
72
72
@ JsonProperty ("num_batch" ) private Integer numBatch ;
73
73
74
- /**
75
- * The number of GQA groups in the transformer layer. Required for some models,
76
- * for example it is 8 for llama2:70b.
77
- */
78
- @ JsonProperty ("num_gqa" ) private Integer numGQA ;
79
-
80
74
/**
81
75
* The number of layers to send to the GPU(s). On macOS, it defaults to 1
82
76
* to enable metal support, 0 to disable.
@@ -327,11 +321,6 @@ public OllamaOptions withNumBatch(Integer numBatch) {
327
321
return this ;
328
322
}
329
323
330
- public OllamaOptions withNumGQA (Integer numGQA ) {
331
- this .numGQA = numGQA ;
332
- return this ;
333
- }
334
-
335
324
public OllamaOptions withNumGPU (Integer numGPU ) {
336
325
this .numGPU = numGPU ;
337
326
return this ;
@@ -518,14 +507,6 @@ public void setNumBatch(Integer numBatch) {
518
507
this .numBatch = numBatch ;
519
508
}
520
509
521
- public Integer getNumGQA () {
522
- return this .numGQA ;
523
- }
524
-
525
- public void setNumGQA (Integer numGQA ) {
526
- this .numGQA = numGQA ;
527
- }
528
-
529
510
public Integer getNumGPU () {
530
511
return this .numGPU ;
531
512
}
@@ -795,7 +776,6 @@ public static OllamaOptions fromOptions(OllamaOptions fromOptions) {
795
776
.withUseNUMA (fromOptions .getUseNUMA ())
796
777
.withNumCtx (fromOptions .getNumCtx ())
797
778
.withNumBatch (fromOptions .getNumBatch ())
798
- .withNumGQA (fromOptions .getNumGQA ())
799
779
.withNumGPU (fromOptions .getNumGPU ())
800
780
.withMainGPU (fromOptions .getMainGPU ())
801
781
.withLowVRAM (fromOptions .getLowVRAM ())
@@ -837,14 +817,13 @@ public boolean equals(Object o) {
837
817
return Objects .equals (model , that .model ) && Objects .equals (format , that .format )
838
818
&& Objects .equals (keepAlive , that .keepAlive ) && Objects .equals (useNUMA , that .useNUMA )
839
819
&& Objects .equals (numCtx , that .numCtx ) && Objects .equals (numBatch , that .numBatch )
840
- && Objects .equals (numGQA , that .numGQA ) && Objects .equals (numGPU , that .numGPU )
841
- && Objects .equals (mainGPU , that .mainGPU ) && Objects .equals (lowVRAM , that .lowVRAM )
842
- && Objects .equals (f16KV , that .f16KV ) && Objects .equals (logitsAll , that .logitsAll )
843
- && Objects .equals (vocabOnly , that .vocabOnly ) && Objects .equals (useMMap , that .useMMap )
844
- && Objects .equals (useMLock , that .useMLock ) && Objects .equals (numThread , that .numThread )
845
- && Objects .equals (numKeep , that .numKeep ) && Objects .equals (seed , that .seed )
846
- && Objects .equals (numPredict , that .numPredict ) && Objects .equals (topK , that .topK )
847
- && Objects .equals (topP , that .topP ) && Objects .equals (tfsZ , that .tfsZ )
820
+ && Objects .equals (numGPU , that .numGPU ) && Objects .equals (mainGPU , that .mainGPU )
821
+ && Objects .equals (lowVRAM , that .lowVRAM ) && Objects .equals (f16KV , that .f16KV )
822
+ && Objects .equals (logitsAll , that .logitsAll ) && Objects .equals (vocabOnly , that .vocabOnly )
823
+ && Objects .equals (useMMap , that .useMMap ) && Objects .equals (useMLock , that .useMLock )
824
+ && Objects .equals (numThread , that .numThread ) && Objects .equals (numKeep , that .numKeep )
825
+ && Objects .equals (seed , that .seed ) && Objects .equals (numPredict , that .numPredict )
826
+ && Objects .equals (topK , that .topK ) && Objects .equals (topP , that .topP ) && Objects .equals (tfsZ , that .tfsZ )
848
827
&& Objects .equals (typicalP , that .typicalP ) && Objects .equals (repeatLastN , that .repeatLastN )
849
828
&& Objects .equals (temperature , that .temperature ) && Objects .equals (repeatPenalty , that .repeatPenalty )
850
829
&& Objects .equals (presencePenalty , that .presencePenalty )
@@ -858,7 +837,7 @@ public boolean equals(Object o) {
858
837
@ Override
859
838
public int hashCode () {
860
839
return Objects .hash (this .model , this .format , this .keepAlive , this .useNUMA , this .numCtx , this .numBatch ,
861
- this .numGQA , numGPU , mainGPU , lowVRAM , this .f16KV , this .logitsAll , this .vocabOnly , this .useMMap ,
840
+ this .numGPU , this . mainGPU , lowVRAM , this .f16KV , this .logitsAll , this .vocabOnly , this .useMMap ,
862
841
this .useMLock , this .numThread , this .numKeep , this .seed , this .numPredict , this .topK , this .topP , tfsZ ,
863
842
this .typicalP , this .repeatLastN , this .temperature , this .repeatPenalty , this .presencePenalty ,
864
843
this .frequencyPenalty , this .mirostat , this .mirostatTau , this .mirostatEta , this .penalizeNewline ,
0 commit comments