Skip to content

Commit 0634e74

Browse files
committed
refactor: new ggml type
Signed-off-by: thxCode <[email protected]>
1 parent: 10321ae · commit: 0634e74

4 files changed: 24 additions and 6 deletions.

file_metadata.go

Lines changed: 10 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -111,6 +111,8 @@ const (
111111
GGUFFileTypeMostlyTQ1_0 // TQ1_0
112112
GGUFFileTypeMostlyTQ2_0 // TQ2_0
113113
GGUFFileTypeMostlyIQ4_NL_4_4 // IQ4_NL_4x4
114+
GGUFFileTypeMostlyIQ4_NL_4_8 // IQ4_NL_4x8
115+
GGUFFileTypeMostlyIQ4_NL_8_8 // IQ4_NL_8x8
114116
_GGUFFileTypeCount // Unknown
115117
)
116118

@@ -274,6 +276,10 @@ func (t GGUFFileType) GGMLType() GGMLType {
274276
return GGMLTypeTQ2_0
275277
case GGUFFileTypeMostlyIQ4_NL_4_4:
276278
return GGMLTypeIQ4_NL_4_4
279+
case GGUFFileTypeMostlyIQ4_NL_4_8:
280+
return GGMLTypeIQ4_NL_4_8
281+
case GGUFFileTypeMostlyIQ4_NL_8_8:
282+
return GGMLTypeIQ4_NL_8_8
277283
default:
278284
}
279285
return _GGMLTypeCount
@@ -396,6 +402,10 @@ func GetFileType(cm map[GGMLType]int) GGUFFileType {
396402
return GGUFFileTypeMostlyTQ2_0
397403
case GGMLTypeIQ4_NL_4_4:
398404
return GGUFFileTypeMostlyIQ4_NL_4_4
405+
case GGMLTypeIQ4_NL_4_8:
406+
return GGUFFileTypeMostlyIQ4_NL_4_8
407+
case GGMLTypeIQ4_NL_8_8:
408+
return GGUFFileTypeMostlyIQ4_NL_8_8
399409
default:
400410
}
401411
return _GGUFFileTypeCount

ggml.go

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -62,6 +62,8 @@ const (
6262
GGMLTypeTQ1_0
6363
GGMLTypeTQ2_0
6464
GGMLTypeIQ4_NL_4_4
65+
GGMLTypeIQ4_NL_4_8
66+
GGMLTypeIQ4_NL_8_8
6567
_GGMLTypeCount // Unknown
6668
)
6769

@@ -104,6 +106,8 @@ var _GGMLTypeTraits = map[GGMLType]GGMLTypeTrait{
104106
GGMLTypeTQ1_0: {BlockSize: 256, TypeSize: 54, Quantized: true},
105107
GGMLTypeTQ2_0: {BlockSize: 256, TypeSize: 66, Quantized: true},
106108
GGMLTypeIQ4_NL_4_4: {BlockSize: 32, TypeSize: 18, Quantized: true},
109+
GGMLTypeIQ4_NL_4_8: {BlockSize: 32, TypeSize: 18, Quantized: true},
110+
GGMLTypeIQ4_NL_8_8: {BlockSize: 32, TypeSize: 18, Quantized: true},
107111
}
108112

109113
// Trait returns the GGMLTypeTrait of the GGMLType.

zz_generated.ggmltype.stringer.go

Lines changed: 5 additions & 3 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

zz_generated.gguffiletype.stringer.go

Lines changed: 5 additions & 3 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments (0)