4 files changed: +16 -5 lines changed
Original file line number | Diff line number | Diff line change
@@ -65,5 +65,6 @@ async function DebugCmakeOptionsFunction() {
6565 console . info ( ) ;
6666
6767 console . info ( `${ chalk . yellow ( "CMake options:" ) } ${ prettyPrintObject ( llama . cmakeOptions ) } ` ) ;
68+ console . info ( `${ chalk . yellow ( "Release:" ) } ${ prettyPrintObject ( llama . llamaCppRelease ) } ` ) ;
6869}
6970
Original file line number Diff line number Diff line change @@ -122,7 +122,7 @@ export async function interactivelyAskForModel({
122122
123123 const compatibilityScore = await ggufInsights ?. configurationResolver . scoreModelConfigurationCompatibility ( {
124124 flashAttention : flashAttention && ggufInsights ?. flashAttentionSupported ,
125- swaFullCache : swaFullCache ,
125+ swaFullCache,
126126 useMmap
127127 } ) ;
128128
Original file line number Diff line number Diff line change @@ -135,8 +135,8 @@ export enum GgufFileType {
135135 MOSTLY_Q4_0_4_4 = 33 , // deprecated
136136 MOSTLY_Q4_0_4_8 = 34 , // deprecated
137137 MOSTLY_Q4_0_8_8 = 35 , // deprecated
138- MOSTLY_TQ1_0 = 36 , // deprecated
139- MOSTLY_TQ2_0 = 37 // deprecated
138+ MOSTLY_TQ1_0 = 36 ,
139+ MOSTLY_TQ2_0 = 37
140140}
141141
142142
Original file line number Diff line number Diff line change @@ -6,7 +6,7 @@ export type GgufTensorInfo = {
66
77 /**
88 * Adjusted offset relative to the file.
9- *
9+ *
1010 * Added by the GGUF parser - not part of the file's metadata.
1111 */
1212 readonly fileOffset : number | bigint ,
@@ -49,5 +49,15 @@ export const enum GgmlType {
4949 I16 = 25 ,
5050 I32 = 26 ,
5151 I64 = 27 ,
52- F64 = 28
52+ F64 = 28 ,
53+ IQ1_M = 29 ,
54+ BF16 = 30 ,
55+ Q4_0_4_4 = 31 ,
56+ Q4_0_4_8 = 32 ,
57+ Q4_0_8_8 = 33 ,
58+ TQ1_0 = 34 ,
59+ TQ2_0 = 35 ,
60+ IQ4_NL_4_4 = 36 ,
61+ IQ4_NL_4_8 = 37 ,
62+ IQ4_NL_8_8 = 38 ,
5363}
You can’t perform that action at this time.
0 commit comments