add format bytes

This commit is contained in:
Michael Yang
2023-10-11 10:55:07 -07:00
parent aca2d65b82
commit b599946b74
4 changed files with 36 additions and 20 deletions

View File

@@ -454,7 +454,7 @@ type PredictRequest struct {
Stop []string `json:"stop,omitempty"`
}
-const maxBufferSize = 512 * 1024 // 512KB
+const maxBufferSize = 512 * 1000 // 512KB
func (llm *llama) Predict(ctx context.Context, prevContext []int, prompt string, fn func(api.GenerateResponse)) error {
prevConvo, err := llm.Decode(ctx, prevContext)