llama: remove model loading for grammar (#10096)

2025-05-11 10:26:53 +02:00 · 2025-04-24 11:51:19 -07:00 · 2025-04-24 11:51:19 -07:00 · a53d744b01
commit a53d744b01
parent 40b10eee6d
13 changed files with 521 additions and 107 deletions
--- a/model/process_text.go
+++ b/model/process_text.go
@ -32,6 +32,7 @@ type TextProcessor interface {
 	Encode(s string, addSpecial bool) ([]int32, error)
 	Decode([]int32) (string, error)
 	Is(int32, Special) bool
+	Vocabulary() *Vocabulary
 }

 type Vocabulary struct {
@ -117,6 +118,8 @@ type BytePairEncoding struct {
 	vocab *Vocabulary
 }

+// Compile-time assertion that *BytePairEncoding implements TextProcessor.
+var _ TextProcessor = (*BytePairEncoding)(nil)
+
 func NewBytePairEncoding(pre string, vocab *Vocabulary) BytePairEncoding {
 	return BytePairEncoding{
 		pre:   regexp2.MustCompile(pre, regexp2.Unicode|regexp2.RE2),
@ -124,6 +127,10 @@ func NewBytePairEncoding(pre string, vocab *Vocabulary) BytePairEncoding {
 	}
 }

+// Vocabulary returns the *Vocabulary held in bpe.vocab. The pointer itself is
+// returned, not a copy of the Vocabulary.
+func (bpe BytePairEncoding) Vocabulary() *Vocabulary {
+	return bpe.vocab
+}
+
 // Is forwards id and special to the Is method of the underlying vocabulary
 // and returns its result unchanged.
 func (bpe BytePairEncoding) Is(id int32, special Special) bool {
 	return bpe.vocab.Is(id, special)
 }