Skip to content

Commit

Permalink
refactor: new ggml type
Browse files: browse the repository at this point in the history.
Signed-off-by: thxCode <[email protected]>
  • Loading branch information
thxCode committed Dec 9, 2024
1 parent 10321ae commit 0634e74
Show file tree
Hide file tree
Showing 4 changed files with 24 additions and 6 deletions.
10 changes: 10 additions & 0 deletions file_metadata.go
Original file line number Diff line number Diff line change
Expand Up @@ -111,6 +111,8 @@ const (
GGUFFileTypeMostlyTQ1_0 // TQ1_0
GGUFFileTypeMostlyTQ2_0 // TQ2_0
GGUFFileTypeMostlyIQ4_NL_4_4 // IQ4_NL_4x4
GGUFFileTypeMostlyIQ4_NL_4_8 // IQ4_NL_4x8
GGUFFileTypeMostlyIQ4_NL_8_8 // IQ4_NL_8x8
_GGUFFileTypeCount // Unknown
)

Expand Down Expand Up @@ -274,6 +276,10 @@ func (t GGUFFileType) GGMLType() GGMLType {
return GGMLTypeTQ2_0
case GGUFFileTypeMostlyIQ4_NL_4_4:
return GGMLTypeIQ4_NL_4_4
case GGUFFileTypeMostlyIQ4_NL_4_8:
return GGMLTypeIQ4_NL_4_8
case GGUFFileTypeMostlyIQ4_NL_8_8:
return GGMLTypeIQ4_NL_8_8
default:
}
return _GGMLTypeCount
Expand Down Expand Up @@ -396,6 +402,10 @@ func GetFileType(cm map[GGMLType]int) GGUFFileType {
return GGUFFileTypeMostlyTQ2_0
case GGMLTypeIQ4_NL_4_4:
return GGUFFileTypeMostlyIQ4_NL_4_4
case GGMLTypeIQ4_NL_4_8:
return GGUFFileTypeMostlyIQ4_NL_4_8
case GGMLTypeIQ4_NL_8_8:
return GGUFFileTypeMostlyIQ4_NL_8_8
default:
}
return _GGUFFileTypeCount
Expand Down
4 changes: 4 additions & 0 deletions ggml.go
Original file line number Diff line number Diff line change
Expand Up @@ -62,6 +62,8 @@ const (
GGMLTypeTQ1_0
GGMLTypeTQ2_0
GGMLTypeIQ4_NL_4_4
GGMLTypeIQ4_NL_4_8
GGMLTypeIQ4_NL_8_8
_GGMLTypeCount // Unknown
)

Expand Down Expand Up @@ -104,6 +106,8 @@ var _GGMLTypeTraits = map[GGMLType]GGMLTypeTrait{
GGMLTypeTQ1_0: {BlockSize: 256, TypeSize: 54, Quantized: true},
GGMLTypeTQ2_0: {BlockSize: 256, TypeSize: 66, Quantized: true},
GGMLTypeIQ4_NL_4_4: {BlockSize: 32, TypeSize: 18, Quantized: true},
GGMLTypeIQ4_NL_4_8: {BlockSize: 32, TypeSize: 18, Quantized: true},
GGMLTypeIQ4_NL_8_8: {BlockSize: 32, TypeSize: 18, Quantized: true},
}

// Trait returns the GGMLTypeTrait of the GGMLType.
Expand Down
8 changes: 5 additions & 3 deletions zz_generated.ggmltype.stringer.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

8 changes: 5 additions & 3 deletions zz_generated.gguffiletype.stringer.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

0 comments on commit 0634e74

Please sign in to comment.